diff --git a/.gitattributes b/.gitattributes
index a6344aac8c09253b3b630fb776ae94478aa0275b..98870b57a7ecb3ffaf218590b389ba1bd19be488 100644
--- a/.gitattributes
+++ b/.gitattributes
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
*tfevents* filter=lfs diff=lfs merge=lfs -text
+wandb/wandb/run-20251002_155442-6v8q0jgn/run-6v8q0jgn.wandb filter=lfs diff=lfs merge=lfs -text
diff --git a/eraser_flow_matching/step12000/config.yaml b/eraser_flow_matching/step12000/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..bcdc1e14f2d420fe1d72bf11ddd06055bee54a43
--- /dev/null
+++ b/eraser_flow_matching/step12000/config.yaml
@@ -0,0 +1,322 @@
+run_name: eraser_20251011_163756
+seed: 6198
+epoch: null
+dry_run: false
+model:
+ d_model: 3584
+ n_heads: 28
+ n_kv_heads: 4
+ qkv_bias: true
+ clip_qkv: null
+ n_layers: 28
+ mlp_ratio: 4
+ mlp_hidden_size: 37888
+ activation_type: swiglu
+ block_type: sequential
+ block_group_size: 1
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1000000.0
+ vision_backbone:
+ image_model_type: openai
+ image_default_input_size:
+ - 336
+ - 336
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ image_emb_dim: 1024
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_head_dim: 64
+ image_mlp_dim: 4096
+ image_mlp_activations: quick_gelu
+ image_dropout_rate: 0.0
+ image_num_pos: 577
+ image_norm_eps: 1.0e-05
+ attention_dropout: 0.0
+ residual_dropout: 0.0
+ initializer_range: 0.02
+ fsdp_wrap: false
+ resize_mode: default
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ attention_type: sdpa
+ float32_attention: true
+ attention_dropout: 0.0
+ attention_layer_norm: false
+ residual_dropout: 0.1
+ response_residual_dropout: 0.0
+ embedding_dropout: 0.0
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ layer_norm_eps: 1.0e-06
+ attention_layer_norm_with_affine: true
+ max_sequence_length: 4096
+ max_position_embeddings: null
+ include_bias: false
+ bias_for_layer_norm: null
+ scale_logits: false
+ vocab_size: 152064
+ embedding_size: 152064
+ ff_out_size: null
+ additional_vocab_size: 128
+ new_embedding_init_range: 0.02
+ weight_tying: false
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ init_cutoff_factor: null
+ norm_after: false
+ precision: amp_bf16
+ max_crops: 12
+ crop_mode: overlap-and-resize-c2
+ use_col_tokens: true
+ prompt_type: uber_model
+ system_prompt_kind: demo_or_style
+ message_formatting: role
+ always_start_with_space: true
+ multi_annotation_weighting: root_subsegments
+ default_inference_len: 65
+ overlap_margins:
+ - 4
+ - 4
+ pad_value: 0.0
+ image_padding_embed: pad_and_partial_pad
+ fix_image_padding: true
+ vit_layers:
+ - -2
+ - -9
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_pooling_2d: attention_meanq
+ image_projector: mlp
+ image_feature_dropout: 0.0
+ initializer_range: 0.02
+ normalize_input_embeds: false
+ use_position_ids: true
+ head_dim: null
+ action_tokenizer:
+ identifier: physical-intelligence/fast
+ tokenizer_dir: null
+ action_dim: 7
+ horizon: 8
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ pad_tokenizer: true
+ moe_num_experts: 8
+ moe_top_k: 2
+ moe_mlp_impl: sparse
+ moe_log_expert_assignment: false
+ moe_shared_expert: false
+ moe_lbl_in_fp32: false
+ moe_interleave: false
+ moe_loss_weight: 0.1
+ moe_zloss_weight: null
+ moe_dropless: true
+ moe_capacity_factor: 1.25
+ action_head: flow_matching
+ num_diffusion_steps: 1000
+ num_diffusion_inference_steps: 30
+ use_proprio: true
+ action_head_dit_hidden_size: 1152
+ action_head_dit_depth: 28
+ action_head_dit_num_heads: 16
+ llm_causal_attention: false
+ action_use_left_eef: true
+ action_use_mobile_base: false
+allow_resume: false
+ft_llm: true
+ft_vit: false
+ft_connector: false
+ft_embedding: lm_head
+lora: false
+use_lora: false
+lora_rank: 8
+lora_llm: false
+lora_vit: false
+lora_connector: false
+early_exit: false
+train_exit_random_layer: false
+optimizer:
+ name: adamw
+ learning_rate: 0.0001
+ weight_decay: 0.01
+ betas:
+ - 0.9
+ - 0.95
+ eps: 1.0e-05
+ connector_learning_rate: 0.0002
+ vit_learning_rate: 6.0e-06
+ llm_learning_rate: 5.0e-05
+ connector_weight_decay: 0.0
+ vit_weight_decay: 0.0
+ llm_weight_decay: 0.0
+ connector_betas:
+ - 0.9
+ - 0.95
+ vit_betas:
+ - 0.9
+ - 0.95
+ llm_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1.0e-06
+ vit_eps: 1.0e-06
+ llm_eps: 1.0e-06
+ metrics_log_interval: 20
+scheduler:
+ name: multimodal
+ units: steps
+ t_warmup: 100
+ t_max: null
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ vit_t_warmup: 2000
+ llm_t_warmup: 2000
+ grad_clip_warmup_steps: null
+ grad_clip_warmup_factor: null
+ warmup_min_lr: 0.0
+data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: train
+ seed: 95818
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: true
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: false
+ timeout: 0
+ rlds_dataset_name: a1_real_world
+ rlds_data_root_dir: /vast/users/xiaodan/zhangjian/datasets/OXE
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: null
+ lerobot_episode_index_end: null
+restore_dataloader: true
+fast_forward_batches: null
+evaluators:
+- label: val
+ data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: validation
+ seed: null
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: false
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: true
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: 353
+ lerobot_episode_index_end: 765
+ device_eval_batch_size: null
+ subset_num_batches: 64
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ eval_name: null
+ skip_if_metrics_cached: true
+eval_interval: 0
+inf_eval_interval: -1
+inf_evaluators: []
+save_folder: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/eraser_flow_matching
+remote_save_folder: null
+canceled_check_interval: 50
+save_interval: 500
+save_interval_unsharded: 500
+save_interval_ephemeral: null
+save_interval_action_head: 500
+save_num_checkpoints_to_keep: 1
+save_num_unsharded_checkpoints_to_keep: 1
+save_num_action_head_checkpoints_to_keep: 2
+save_overwrite: true
+force_save_unsharded: false
+no_pre_train_checkpoint: true
+initial_model_checkpoint: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_model_config: null
+checkpoint_dir: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_path: null
+load_path_sharded_checkpointer: null
+reset_optimizer_state: false
+reset_trainer_state: false
+save_dataloader_state: false
+reset_dataloader_state: false
+keep_lr_on_load: true
+sharded_checkpointer: torch_legacy
+max_duration: 500000
+global_train_batch_size: 126
+device_train_batch_size: 15
+device_train_microbatch_size: 16
+device_eval_batch_size: 4
+eval_subset_num_batches: -1
+eval_on_load: false
+device_inf_eval_batch_size: 16
+inf_eval_subset_num_batches: -1
+device_train_grad_accum: 0
+max_grad_norm: 1.0
+multi_component_grad_norm: true
+batch_divisor: global_batch
+max_grad_norm_ratio: null
+precision: amp_bf16
+wandb:
+ project: a1-realworld
+ entity: henryeap
+ group: null
+ name: eraser_20251011_163756
+ tags:
+ - watching
+ log_artifacts: false
+ rank_zero_only: true
+ log_interval: 1
+speed_monitor:
+ window_size: 20
+ gpu_flops_available: null
+console_log_interval: 1
+gen1_gc_interval: 1
+compile: null
+fsdp:
+ use_orig_params: true
+ sharding_strategy: FULL_SHARD
+ wrapping_strategy: by_block_and_size
+ precision: float
+ hybrid_sharding_num_model_replicas: null
+softmax_auxiliary_loss: true
+softmax_auxiliary_loss_scale: 0.0001
+time_limit: null
+extra_steps_after_cancel: 10
+python_profiling: false
+torch_profiling: false
+stop_at: 500000
+stop_after: null
+activation_checkpointing: whole_layer
+fused_loss: null
diff --git a/eraser_l1_regression/step12000-unsharded/config.yaml b/eraser_l1_regression/step12000-unsharded/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..a6f431bf4d5a0b20f2e83c546b4918beefe9339c
--- /dev/null
+++ b/eraser_l1_regression/step12000-unsharded/config.yaml
@@ -0,0 +1,322 @@
+run_name: eraser_20251011_163803
+seed: 6198
+epoch: null
+dry_run: false
+model:
+ d_model: 3584
+ n_heads: 28
+ n_kv_heads: 4
+ qkv_bias: true
+ clip_qkv: null
+ n_layers: 28
+ mlp_ratio: 4
+ mlp_hidden_size: 37888
+ activation_type: swiglu
+ block_type: sequential
+ block_group_size: 1
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1000000.0
+ vision_backbone:
+ image_model_type: openai
+ image_default_input_size:
+ - 336
+ - 336
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ image_emb_dim: 1024
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_head_dim: 64
+ image_mlp_dim: 4096
+ image_mlp_activations: quick_gelu
+ image_dropout_rate: 0.0
+ image_num_pos: 577
+ image_norm_eps: 1.0e-05
+ attention_dropout: 0.0
+ residual_dropout: 0.0
+ initializer_range: 0.02
+ fsdp_wrap: false
+ resize_mode: default
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ attention_type: sdpa
+ float32_attention: true
+ attention_dropout: 0.0
+ attention_layer_norm: false
+ residual_dropout: 0.1
+ response_residual_dropout: 0.0
+ embedding_dropout: 0.0
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ layer_norm_eps: 1.0e-06
+ attention_layer_norm_with_affine: true
+ max_sequence_length: 4096
+ max_position_embeddings: null
+ include_bias: false
+ bias_for_layer_norm: null
+ scale_logits: false
+ vocab_size: 152064
+ embedding_size: 152064
+ ff_out_size: null
+ additional_vocab_size: 128
+ new_embedding_init_range: 0.02
+ weight_tying: false
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ init_cutoff_factor: null
+ norm_after: false
+ precision: amp_bf16
+ max_crops: 12
+ crop_mode: overlap-and-resize-c2
+ use_col_tokens: true
+ prompt_type: uber_model
+ system_prompt_kind: demo_or_style
+ message_formatting: role
+ always_start_with_space: true
+ multi_annotation_weighting: root_subsegments
+ default_inference_len: 65
+ overlap_margins:
+ - 4
+ - 4
+ pad_value: 0.0
+ image_padding_embed: pad_and_partial_pad
+ fix_image_padding: true
+ vit_layers:
+ - -2
+ - -9
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_pooling_2d: attention_meanq
+ image_projector: mlp
+ image_feature_dropout: 0.0
+ initializer_range: 0.02
+ normalize_input_embeds: false
+ use_position_ids: true
+ head_dim: null
+ action_tokenizer:
+ identifier: physical-intelligence/fast
+ tokenizer_dir: null
+ action_dim: 7
+ horizon: 8
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ pad_tokenizer: true
+ moe_num_experts: 8
+ moe_top_k: 2
+ moe_mlp_impl: sparse
+ moe_log_expert_assignment: false
+ moe_shared_expert: false
+ moe_lbl_in_fp32: false
+ moe_interleave: false
+ moe_loss_weight: 0.1
+ moe_zloss_weight: null
+ moe_dropless: true
+ moe_capacity_factor: 1.25
+ action_head: l1_regression
+ num_diffusion_steps: 1000
+ num_diffusion_inference_steps: 30
+ use_proprio: true
+ action_head_dit_hidden_size: 1152
+ action_head_dit_depth: 28
+ action_head_dit_num_heads: 16
+ llm_causal_attention: false
+ action_use_left_eef: true
+ action_use_mobile_base: false
+allow_resume: false
+ft_llm: true
+ft_vit: false
+ft_connector: false
+ft_embedding: lm_head
+lora: false
+use_lora: false
+lora_rank: 8
+lora_llm: false
+lora_vit: false
+lora_connector: false
+early_exit: false
+train_exit_random_layer: false
+optimizer:
+ name: adamw
+ learning_rate: 0.0001
+ weight_decay: 0.01
+ betas:
+ - 0.9
+ - 0.95
+ eps: 1.0e-05
+ connector_learning_rate: 0.0002
+ vit_learning_rate: 6.0e-06
+ llm_learning_rate: 5.0e-05
+ connector_weight_decay: 0.0
+ vit_weight_decay: 0.0
+ llm_weight_decay: 0.0
+ connector_betas:
+ - 0.9
+ - 0.95
+ vit_betas:
+ - 0.9
+ - 0.95
+ llm_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1.0e-06
+ vit_eps: 1.0e-06
+ llm_eps: 1.0e-06
+ metrics_log_interval: 20
+scheduler:
+ name: multimodal
+ units: steps
+ t_warmup: 100
+ t_max: null
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ vit_t_warmup: 2000
+ llm_t_warmup: 2000
+ grad_clip_warmup_steps: null
+ grad_clip_warmup_factor: null
+ warmup_min_lr: 0.0
+data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: train
+ seed: 95818
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: true
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: false
+ timeout: 0
+ rlds_dataset_name: a1_real_world
+ rlds_data_root_dir: /vast/users/xiaodan/zhangjian/datasets/OXE
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: null
+ lerobot_episode_index_end: null
+restore_dataloader: true
+fast_forward_batches: null
+evaluators:
+- label: val
+ data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: validation
+ seed: null
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: false
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: true
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: 353
+ lerobot_episode_index_end: 765
+ device_eval_batch_size: null
+ subset_num_batches: 64
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ eval_name: null
+ skip_if_metrics_cached: true
+eval_interval: 0
+inf_eval_interval: -1
+inf_evaluators: []
+save_folder: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/eraser_l1_regression
+remote_save_folder: null
+canceled_check_interval: 50
+save_interval: 500
+save_interval_unsharded: 500
+save_interval_ephemeral: null
+save_interval_action_head: 500
+save_num_checkpoints_to_keep: 1
+save_num_unsharded_checkpoints_to_keep: 1
+save_num_action_head_checkpoints_to_keep: 2
+save_overwrite: true
+force_save_unsharded: false
+no_pre_train_checkpoint: true
+initial_model_checkpoint: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_model_config: null
+checkpoint_dir: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_path: null
+load_path_sharded_checkpointer: null
+reset_optimizer_state: false
+reset_trainer_state: false
+save_dataloader_state: false
+reset_dataloader_state: false
+keep_lr_on_load: true
+sharded_checkpointer: torch_legacy
+max_duration: 500000
+global_train_batch_size: 126
+device_train_batch_size: 15
+device_train_microbatch_size: 16
+device_eval_batch_size: 4
+eval_subset_num_batches: -1
+eval_on_load: false
+device_inf_eval_batch_size: 16
+inf_eval_subset_num_batches: -1
+device_train_grad_accum: 0
+max_grad_norm: 1.0
+multi_component_grad_norm: true
+batch_divisor: global_batch
+max_grad_norm_ratio: null
+precision: amp_bf16
+wandb:
+ project: a1-realworld
+ entity: henryeap
+ group: null
+ name: eraser_20251011_163803
+ tags:
+ - watching
+ log_artifacts: false
+ rank_zero_only: true
+ log_interval: 1
+speed_monitor:
+ window_size: 20
+ gpu_flops_available: null
+console_log_interval: 1
+gen1_gc_interval: 1
+compile: null
+fsdp:
+ use_orig_params: true
+ sharding_strategy: FULL_SHARD
+ wrapping_strategy: by_block_and_size
+ precision: float
+ hybrid_sharding_num_model_replicas: null
+softmax_auxiliary_loss: true
+softmax_auxiliary_loss_scale: 0.0001
+time_limit: null
+extra_steps_after_cancel: 10
+python_profiling: false
+torch_profiling: false
+stop_at: 500000
+stop_after: null
+activation_checkpointing: whole_layer
+fused_loss: null
diff --git a/eraser_l1_regression/step12000/config.yaml b/eraser_l1_regression/step12000/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..a6f431bf4d5a0b20f2e83c546b4918beefe9339c
--- /dev/null
+++ b/eraser_l1_regression/step12000/config.yaml
@@ -0,0 +1,322 @@
+run_name: eraser_20251011_163803
+seed: 6198
+epoch: null
+dry_run: false
+model:
+ d_model: 3584
+ n_heads: 28
+ n_kv_heads: 4
+ qkv_bias: true
+ clip_qkv: null
+ n_layers: 28
+ mlp_ratio: 4
+ mlp_hidden_size: 37888
+ activation_type: swiglu
+ block_type: sequential
+ block_group_size: 1
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1000000.0
+ vision_backbone:
+ image_model_type: openai
+ image_default_input_size:
+ - 336
+ - 336
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ image_emb_dim: 1024
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_head_dim: 64
+ image_mlp_dim: 4096
+ image_mlp_activations: quick_gelu
+ image_dropout_rate: 0.0
+ image_num_pos: 577
+ image_norm_eps: 1.0e-05
+ attention_dropout: 0.0
+ residual_dropout: 0.0
+ initializer_range: 0.02
+ fsdp_wrap: false
+ resize_mode: default
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ attention_type: sdpa
+ float32_attention: true
+ attention_dropout: 0.0
+ attention_layer_norm: false
+ residual_dropout: 0.1
+ response_residual_dropout: 0.0
+ embedding_dropout: 0.0
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ layer_norm_eps: 1.0e-06
+ attention_layer_norm_with_affine: true
+ max_sequence_length: 4096
+ max_position_embeddings: null
+ include_bias: false
+ bias_for_layer_norm: null
+ scale_logits: false
+ vocab_size: 152064
+ embedding_size: 152064
+ ff_out_size: null
+ additional_vocab_size: 128
+ new_embedding_init_range: 0.02
+ weight_tying: false
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ init_cutoff_factor: null
+ norm_after: false
+ precision: amp_bf16
+ max_crops: 12
+ crop_mode: overlap-and-resize-c2
+ use_col_tokens: true
+ prompt_type: uber_model
+ system_prompt_kind: demo_or_style
+ message_formatting: role
+ always_start_with_space: true
+ multi_annotation_weighting: root_subsegments
+ default_inference_len: 65
+ overlap_margins:
+ - 4
+ - 4
+ pad_value: 0.0
+ image_padding_embed: pad_and_partial_pad
+ fix_image_padding: true
+ vit_layers:
+ - -2
+ - -9
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_pooling_2d: attention_meanq
+ image_projector: mlp
+ image_feature_dropout: 0.0
+ initializer_range: 0.02
+ normalize_input_embeds: false
+ use_position_ids: true
+ head_dim: null
+ action_tokenizer:
+ identifier: physical-intelligence/fast
+ tokenizer_dir: null
+ action_dim: 7
+ horizon: 8
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ pad_tokenizer: true
+ moe_num_experts: 8
+ moe_top_k: 2
+ moe_mlp_impl: sparse
+ moe_log_expert_assignment: false
+ moe_shared_expert: false
+ moe_lbl_in_fp32: false
+ moe_interleave: false
+ moe_loss_weight: 0.1
+ moe_zloss_weight: null
+ moe_dropless: true
+ moe_capacity_factor: 1.25
+ action_head: l1_regression
+ num_diffusion_steps: 1000
+ num_diffusion_inference_steps: 30
+ use_proprio: true
+ action_head_dit_hidden_size: 1152
+ action_head_dit_depth: 28
+ action_head_dit_num_heads: 16
+ llm_causal_attention: false
+ action_use_left_eef: true
+ action_use_mobile_base: false
+allow_resume: false
+ft_llm: true
+ft_vit: false
+ft_connector: false
+ft_embedding: lm_head
+lora: false
+use_lora: false
+lora_rank: 8
+lora_llm: false
+lora_vit: false
+lora_connector: false
+early_exit: false
+train_exit_random_layer: false
+optimizer:
+ name: adamw
+ learning_rate: 0.0001
+ weight_decay: 0.01
+ betas:
+ - 0.9
+ - 0.95
+ eps: 1.0e-05
+ connector_learning_rate: 0.0002
+ vit_learning_rate: 6.0e-06
+ llm_learning_rate: 5.0e-05
+ connector_weight_decay: 0.0
+ vit_weight_decay: 0.0
+ llm_weight_decay: 0.0
+ connector_betas:
+ - 0.9
+ - 0.95
+ vit_betas:
+ - 0.9
+ - 0.95
+ llm_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1.0e-06
+ vit_eps: 1.0e-06
+ llm_eps: 1.0e-06
+ metrics_log_interval: 20
+scheduler:
+ name: multimodal
+ units: steps
+ t_warmup: 100
+ t_max: null
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ vit_t_warmup: 2000
+ llm_t_warmup: 2000
+ grad_clip_warmup_steps: null
+ grad_clip_warmup_factor: null
+ warmup_min_lr: 0.0
+data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: train
+ seed: 95818
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: true
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: false
+ timeout: 0
+ rlds_dataset_name: a1_real_world
+ rlds_data_root_dir: /vast/users/xiaodan/zhangjian/datasets/OXE
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: null
+ lerobot_episode_index_end: null
+restore_dataloader: true
+fast_forward_batches: null
+evaluators:
+- label: val
+ data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: validation
+ seed: null
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: false
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: true
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: 353
+ lerobot_episode_index_end: 765
+ device_eval_batch_size: null
+ subset_num_batches: 64
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ eval_name: null
+ skip_if_metrics_cached: true
+eval_interval: 0
+inf_eval_interval: -1
+inf_evaluators: []
+save_folder: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/eraser_l1_regression
+remote_save_folder: null
+canceled_check_interval: 50
+save_interval: 500
+save_interval_unsharded: 500
+save_interval_ephemeral: null
+save_interval_action_head: 500
+save_num_checkpoints_to_keep: 1
+save_num_unsharded_checkpoints_to_keep: 1
+save_num_action_head_checkpoints_to_keep: 2
+save_overwrite: true
+force_save_unsharded: false
+no_pre_train_checkpoint: true
+initial_model_checkpoint: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_model_config: null
+checkpoint_dir: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_path: null
+load_path_sharded_checkpointer: null
+reset_optimizer_state: false
+reset_trainer_state: false
+save_dataloader_state: false
+reset_dataloader_state: false
+keep_lr_on_load: true
+sharded_checkpointer: torch_legacy
+max_duration: 500000
+global_train_batch_size: 126
+device_train_batch_size: 15
+device_train_microbatch_size: 16
+device_eval_batch_size: 4
+eval_subset_num_batches: -1
+eval_on_load: false
+device_inf_eval_batch_size: 16
+inf_eval_subset_num_batches: -1
+device_train_grad_accum: 0
+max_grad_norm: 1.0
+multi_component_grad_norm: true
+batch_divisor: global_batch
+max_grad_norm_ratio: null
+precision: amp_bf16
+wandb:
+ project: a1-realworld
+ entity: henryeap
+ group: null
+ name: eraser_20251011_163803
+ tags:
+ - watching
+ log_artifacts: false
+ rank_zero_only: true
+ log_interval: 1
+speed_monitor:
+ window_size: 20
+ gpu_flops_available: null
+console_log_interval: 1
+gen1_gc_interval: 1
+compile: null
+fsdp:
+ use_orig_params: true
+ sharding_strategy: FULL_SHARD
+ wrapping_strategy: by_block_and_size
+ precision: float
+ hybrid_sharding_num_model_replicas: null
+softmax_auxiliary_loss: true
+softmax_auxiliary_loss_scale: 0.0001
+time_limit: null
+extra_steps_after_cancel: 10
+python_profiling: false
+torch_profiling: false
+stop_at: 500000
+stop_after: null
+activation_checkpointing: whole_layer
+fused_loss: null
diff --git a/eraser_l1_regression/wandb/wandb/debug-internal.log b/eraser_l1_regression/wandb/wandb/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..386717a53f873d08b6a50146f5882cde5ce853d2
--- /dev/null
+++ b/eraser_l1_regression/wandb/wandb/debug-internal.log
@@ -0,0 +1,12 @@
+{"time":"2025-10-11T16:38:45.369810639Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-10-11T16:38:46.624568558Z","level":"INFO","msg":"stream: created new stream","id":"qzez8pv7"}
+{"time":"2025-10-11T16:38:46.624626598Z","level":"INFO","msg":"stream: started","id":"qzez8pv7"}
+{"time":"2025-10-11T16:38:46.624662329Z","level":"INFO","msg":"sender: started","stream_id":"qzez8pv7"}
+{"time":"2025-10-11T16:38:46.624681929Z","level":"INFO","msg":"handler: started","stream_id":"qzez8pv7"}
+{"time":"2025-10-11T16:38:46.624653129Z","level":"INFO","msg":"writer: started","stream_id":"qzez8pv7"}
+{"time":"2025-10-11T20:03:56.095706913Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
+{"time":"2025-10-13T02:33:28.920574862Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/henryeap/a1-realworld/qzez8pv7/file_stream","body":"\n
\n\n502 Server Error\n\n\nError: Server Error
\nThe server encountered a temporary error and could not complete your request.
Please try again in 30 seconds.\n
\n\n"}
+{"time":"2025-10-13T16:23:56.963675478Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
+{"time":"2025-10-13T20:04:02.844107426Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
+{"time":"2025-10-13T22:38:31.203849115Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
+{"time":"2025-10-14T15:32:47.24166171Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
diff --git a/eraser_l1_regression/wandb/wandb/debug.log b/eraser_l1_regression/wandb/wandb/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/files/requirements.txt b/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/files/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..5a5e971a5d9f3b6f6a75248e203682c5fbcd69e8
--- /dev/null
+++ b/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/files/requirements.txt
@@ -0,0 +1,286 @@
+ai2-molmo==0.0.0
+astunparse==1.6.3
+flatbuffers==25.2.10
+gast==0.6.0
+google-pasta==0.2.0
+h5py==3.14.0
+libclang==18.1.1
+Markdown==3.9
+namex==0.1.0
+opt_einsum==3.4.0
+optree==0.17.0
+tensorboard-data-server==0.7.2
+tensorflow-io-gcs-filesystem==0.37.1
+termcolor==3.1.0
+Werkzeug==3.1.3
+Brotli==1.1.0
+Farama-Notifications==0.0.4
+MarkupSafe==2.1.5
+PyYAML==6.0.2
+absl-py==2.3.1
+accelerate==1.10.1
+ai2-molmo==0.0.0
+aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.15
+aiosignal==1.4.0
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+anyio==4.10.0
+array_record==0.8.1
+async-timeout==5.0.1
+attrs==25.3.0
+av==15.1.0
+backports.tarfile==1.2.0
+beaker-gantry==3.2.0
+beaker-py==2.5.0
+black==23.12.1
+blinker==1.9.0
+boltons==25.0.0
+boto3==1.40.33
+botocore==1.40.33
+build==1.3.0
+cached_path==1.7.3
+cached-property==2.0.1
+cachetools==5.5.2
+certifi==2025.8.3
+cffi==2.0.0
+charset-normalizer==3.4.3
+click==8.2.1
+click-help-colors==0.9.4
+click-option-group==0.5.7
+cloudpickle==3.1.1
+cmake==4.1.0
+contourpy==1.3.2
+cryptography==46.0.1
+cycler==0.12.1
+dataclass-extensions==0.2.3
+datasets==3.6.0
+decorator==5.2.1
+deepdiff==8.6.1
+diffusers==0.35.1
+dill==0.3.8
+distro==1.9.0
+dlimp==0.0.1
+dm-tree==0.1.9
+docutils==0.22.1
+draccus==0.10.0
+editdistance==0.8.1
+einops==0.8.1
+einops-exts==0.0.4
+et_xmlfile==2.0.0
+etils==1.13.0
+evdev==1.9.2
+exceptiongroup==1.3.0
+face==24.0.0
+fastapi==0.116.2
+ffmpy==0.6.1
+fiddle==0.3.0
+filelock==3.13.1
+Flask==3.1.2
+fonttools==4.60.0
+frozenlist==1.7.0
+fsspec==2023.9.2
+ftfy==6.3.1
+gcsfs==2023.9.2
+gitdb==4.0.12
+GitPython==3.1.45
+glom==24.11.0
+google-api-core==2.25.1
+google-auth==2.40.3
+google-auth-oauthlib==1.2.2
+google-cloud-core==2.4.3
+google-cloud-storage==2.19.0
+google-crc32c==1.7.1
+google-resumable-media==2.7.2
+googleapis-common-protos==1.70.0
+gradio==5.46.0
+gradio_client==1.13.0
+graphviz==0.21
+groovy==0.1.2
+grpcio==1.75.0
+gymnasium==0.29.1
+h11==0.16.0
+hf_transfer==0.1.9
+hf-xet==1.1.10
+httpcore==1.0.9
+httpx==0.28.1
+huggingface-hub==0.35.0
+id==1.5.0
+idna==3.10
+imageio==2.37.0
+imageio-ffmpeg==0.6.0
+importlib_metadata==8.7.0
+importlib_resources==6.5.2
+iniconfig==2.1.0
+inquirerpy==0.3.4
+isort==5.12.0
+itsdangerous==2.2.0
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.3.0
+jeepney==0.9.0
+Jinja2==3.1.4
+jiter==0.11.0
+jmespath==1.0.1
+joblib==1.5.2
+jsonlines==4.0.0
+keras==2.15.0
+keyring==25.6.0
+kiwisolver==1.4.9
+latex2sympy2_extended==1.10.2
+lerobot==0.3.4
+Levenshtein==0.27.1
+libcst==1.8.4
+lightning-utilities==0.15.2
+markdown-it-py==4.0.0
+math-verify==0.8.0
+matplotlib==3.10.6
+mdurl==0.1.2
+mergedeep==1.3.4
+ml-dtypes==0.2.0
+ml_dtypes==0.5.3
+more-itertools==10.8.0
+mpmath==1.3.0
+msgspec==0.19.0
+multidict==6.6.4
+multiprocess==0.70.16
+mypy==1.3.0
+mypy_extensions==1.1.0
+necessary==0.4.3
+networkx==3.3
+nh3==0.3.0
+nltk==3.9.1
+numpy==1.26.4
+oauthlib==3.3.1
+omegaconf==2.3.0
+openai==1.108.0
+opencv-python-headless==4.12.0.88
+OpenEXR==3.4.0
+openpyxl==3.1.5
+orderly-set==5.5.0
+orjson==3.11.3
+packaging==25.0
+pandas==2.3.2
+pathspec==0.12.1
+petname==2.6
+pfzy==0.3.4
+pillow==11.0.0
+pip==25.2
+platformdirs==4.4.0
+pluggy==1.6.0
+promise==2.3
+prompt_toolkit==3.0.52
+propcache==0.3.2
+proto-plus==1.26.1
+protobuf==4.21.12
+protobuf==6.32.1
+psutil==7.1.0
+pyarrow==21.0.0
+pyasn1==0.6.1
+pyasn1_modules==0.4.2
+pycparser==2.23
+pydantic==2.11.9
+pydantic_core==2.33.2
+pydub==0.25.1
+Pygments==2.19.2
+pynput==1.8.1
+pyparsing==3.2.4
+pyproject_hooks==1.2.0
+pyserial==3.5
+pytest==8.4.2
+pytest-sphinx==0.6.3
+python-dateutil==2.9.0.post0
+python-Levenshtein==0.27.1
+python-multipart==0.0.20
+python-xlib==0.33
+pytorch-triton-rocm==3.4.0
+pytz==2025.2
+pyyaml-include==1.4.1
+RapidFuzz==3.14.1
+readme_renderer==44.0
+regex==2025.9.1
+requests==2.32.5
+requests-oauthlib==2.0.0
+requests-toolbelt==1.0.0
+requirements-parser==0.13.0
+rerun-sdk==0.22.1
+rfc3986==2.0.0
+rich==13.9.4
+rsa==4.9.1
+ruff==0.13.0
+s3transfer==0.14.0
+safehttpx==0.1.6
+safetensors==0.6.2
+scikit-learn==1.7.2
+scipy==1.15.3
+SecretStorage==3.4.0
+semantic-version==2.10.0
+sentencepiece==0.2.1
+sentry-sdk==2.38.0
+setuptools==78.1.1
+shellingham==1.5.4
+six==1.17.0
+smart_open==7.3.1
+smashed==0.21.5
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.48.0
+sympy==1.13.3
+tensorboard==2.15.2
+tensorboard==2.19.0
+tensorflow==2.15.0
+tensorflow-addons==0.23.0
+tensorflow-datasets==4.9.3
+tensorflow-estimator==2.15.0
+tensorflow-graphics==2021.12.3
+tensorflow-metadata==1.17.2
+threadpoolctl==3.6.0
+timm==1.0.19
+tokenizers==0.22.0
+toml==0.10.2
+tomli==2.2.1
+tomlkit==0.13.3
+torch==2.8.0+rocm6.4
+torchcodec==0.5
+torchmetrics==1.8.2
+torchvision==0.23.0+rocm6.4
+tqdm==4.67.1
+transformers==4.56.1
+trimesh==4.8.2
+trouting==0.3.3
+twine==6.2.0
+typeguard==2.13.3
+typer==0.17.4
+typing_extensions==4.15.0
+typing-inspect==0.9.0
+typing-inspection==0.4.1
+tzdata==2025.2
+urllib3==2.5.0
+uvicorn==0.35.0
+wandb==0.21.4
+wcwidth==0.2.13
+websockets==15.0.1
+wheel==0.45.1
+wrapt==1.14.2
+xxhash==3.5.0
+yarl==1.20.1
+zipp==3.23.0
+lerobot==0.3.4
+minLoRA==0.1.0
+autocommand==2.2.2
+backports.tarfile==1.2.0
+importlib_metadata==8.0.0
+inflect==7.3.1
+jaraco.collections==5.1.0
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+more-itertools==10.3.0
+packaging==24.2
+platformdirs==4.2.2
+tomli==2.0.1
+typeguard==4.3.0
+typing_extensions==4.12.2
+wheel==0.45.1
+zipp==3.19.2
diff --git a/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/files/wandb-metadata.json b/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/files/wandb-metadata.json
new file mode 100644
index 0000000000000000000000000000000000000000..b063f71559cb2ce24880c11879e497e0d37f94f0
--- /dev/null
+++ b/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/files/wandb-metadata.json
@@ -0,0 +1,204 @@
+{
+ "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35",
+ "python": "CPython 3.10.18",
+ "startedAt": "2025-10-11T16:38:44.897304Z",
+ "args": [
+ "qwen2_7b",
+ "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/eraser_l1_regression",
+ "--vision_backbone",
+ "openai",
+ "--action_head",
+ "l1_regression",
+ "--seq_len",
+ "1600",
+ "--ft_llm",
+ "--checkpoint",
+ "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924",
+ "--device_train_microbatch_size",
+ "16",
+ "--global_batch_size",
+ "126",
+ "--dataset",
+ "vla_dataset_realworld",
+ "--llm_learning_rate",
+ "5e-5",
+ "--wandb_entity",
+ "henryeap",
+ "--wandb_project",
+ "a1-realworld",
+ "--wandb_run_name",
+ "eraser",
+ "--real_world_vla_config_path",
+ "vla_config_realworld/vla_config_eraser.yaml",
+ "--save_overwrite"
+ ],
+ "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py",
+ "codePath": "launch_scripts/train_vla.py",
+ "codePathLocal": "launch_scripts/train_vla.py",
+ "git": {
+ "remote": "https://github.com/Spatialtemporal-AI/A1.git",
+ "commit": "7c171df5d31577ede69d05172c2bc62d42ef3e3d"
+ },
+ "email": "ihenrykwok@outlook.com",
+ "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/eraser_l1_regression/wandb",
+ "host": "auh7-1b-gpu-252",
+ "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "Instinct MI210",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "470343073792",
+ "used": "50572640256"
+ }
+ },
+ "memory": {
+ "total": "2434606936064"
+ },
+ "gpu_amd": [
+ {
+ "id": "2",
+ "uniqueId": "0xb1e32805d91e8fd",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "5",
+ "uniqueId": "0xf68552567a447d29",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "0",
+ "uniqueId": "0xb5f4e58f50394bbb",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "3",
+ "uniqueId": "0xfb9d87270270f7af",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "6",
+ "uniqueId": "0x558725d79035e281",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "4",
+ "uniqueId": "0xedec3b515d1caf9",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "7",
+ "uniqueId": "0x651131bef1a09ac7",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "1",
+ "uniqueId": "0xd41cfefdcf23b69b",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ }
+ ],
+ "slurm": {
+ "cluster_name": "ai-04r",
+ "conf": "/etc/slurm/slurm.conf",
+ "cpus_on_node": "128",
+ "gpus_on_node": "8",
+ "gtids": "0",
+ "job_account": "faculty-acc",
+ "job_cpus_per_node": "128",
+ "job_end_time": "1760459846",
+ "job_gid": "2000",
+ "job_gpus": "0,1,2,3,4,5,6,7",
+ "job_id": "2286",
+ "job_name": "mh_eraser_l1_regression",
+ "job_nodelist": "auh7-1b-gpu-252",
+ "job_num_nodes": "1",
+ "job_partition": "faculty",
+ "job_qos": "xdqos",
+ "job_start_time": "1760200646",
+ "job_uid": "2013",
+ "job_user": "xiaodan",
+ "jobid": "2286",
+ "localid": "0",
+ "nnodes": "1",
+ "nodeid": "0",
+ "nodelist": "auh7-1b-gpu-252",
+ "nprocs": "1",
+ "ntasks": "1",
+ "ntasks_per_node": "1",
+ "oom_kill_step": "0",
+ "prio_process": "0",
+ "procid": "0",
+ "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts",
+ "submit_host": "auh-1b-cpu-login-001",
+ "task_pid": "579086",
+ "tasks_per_node": "1",
+ "topology_addr": "auh7-1b-gpu-252",
+ "topology_addr_pattern": "node"
+ },
+ "writerId": "td93jux4p0c1uemtf61zmtfwi71qa2wt"
+}
\ No newline at end of file
diff --git a/glue/wandb/wandb/debug-internal.log b/glue/wandb/wandb/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..e42a40b41b0c9e340594ed1db9da0abd2fff3ae6
--- /dev/null
+++ b/glue/wandb/wandb/debug-internal.log
@@ -0,0 +1,6 @@
+{"time":"2025-10-02T16:28:44.574145675Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-10-02T16:28:45.769098374Z","level":"INFO","msg":"stream: created new stream","id":"bzkyoc0w"}
+{"time":"2025-10-02T16:28:45.769135025Z","level":"INFO","msg":"stream: started","id":"bzkyoc0w"}
+{"time":"2025-10-02T16:28:45.769167365Z","level":"INFO","msg":"handler: started","stream_id":"bzkyoc0w"}
+{"time":"2025-10-02T16:28:45.769158745Z","level":"INFO","msg":"writer: started","stream_id":"bzkyoc0w"}
+{"time":"2025-10-02T16:28:45.769191036Z","level":"INFO","msg":"sender: started","stream_id":"bzkyoc0w"}
diff --git a/glue/wandb/wandb/debug.log b/glue/wandb/wandb/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/glue/wandb/wandb/run-20251002_162842-zmotbaex/files/output.log b/glue/wandb/wandb/run-20251002_162842-zmotbaex/files/output.log
new file mode 100644
index 0000000000000000000000000000000000000000..e6ab11e70bbad95cbbfe78ebc574dda58846fb85
--- /dev/null
+++ b/glue/wandb/wandb/run-20251002_162842-zmotbaex/files/output.log
@@ -0,0 +1,98 @@
+wandb: Detected [openai] in use.
+wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
+wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
+10/02 [16:28:44] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Glue', 8, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 8, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 8, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}}
+****** Skip RLDS main; path not found: None
+****** start build LeRobot main...
+build_tokenizer, cache_dir None tokenizer_dir None
+10/02 [16:28:51] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:130
+ INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:435
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Glue
+****** length of the dataset: 10316
+****** Skip RLDS open-source-real-world; mixture 'a1_real_world' not found under: /vast/users/xiaodan/zhangjian/datasets/OXE
+****** Expect one of: []
+****** path: None
+****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None
+****** After build vla train dataset...
+****** iterable_sources: []
+****** Before build mixed iterable dataset...
+****** Build vla train dataloader successfully!
+************************* Build train_dataloader successful!
+************************* Before build_inf_evaluators
+10/02 [16:28:57] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+************************* Build evaluators successful!
+************************* Early exit flags: early_exit=False
+************************* Initialize model successful!
+***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt
+***** Load checkpoint successful!
+missing keys: ['action_head.state_proj.weight', 'action_head.state_proj.bias', 'action_head.action_in_proj.weight', 'action_head.action_in_proj.bias', 'action_head.action_time_in.weight', 'action_head.action_time_in.bias', 'action_head.action_time_out.weight', 'action_head.action_time_out.bias', 'action_head.memory_proj.weight', 'action_head.memory_proj.bias', 'action_head.gemma.model.layers.0.self_attn.q_proj.weight', 'action_head.gemma.model.layers.0.self_attn.k_proj.weight', 'action_head.gemma.model.layers.0.self_attn.v_proj.weight', 'action_head.gemma.model.layers.0.self_attn.o_proj.weight', 'action_head.gemma.model.layers.0.mlp.gate_proj.weight', 'action_head.gemma.model.layers.0.mlp.up_proj.weight', 'action_head.gemma.model.layers.0.mlp.down_proj.weight', 'action_head.gemma.model.layers.0.input_layernorm.weight', 'action_head.gemma.model.layers.0.post_attention_layernorm.weight', 'action_head.gemma.model.layers.1.self_attn.q_proj.weight', 'action_head.gemma.model.layers.1.self_attn.k_proj.weight', 'action_head.gemma.model.layers.1.self_attn.v_proj.weight', 'action_head.gemma.model.layers.1.self_attn.o_proj.weight', 'action_head.gemma.model.layers.1.mlp.gate_proj.weight', 'action_head.gemma.model.layers.1.mlp.up_proj.weight', 'action_head.gemma.model.layers.1.mlp.down_proj.weight', 'action_head.gemma.model.layers.1.input_layernorm.weight', 'action_head.gemma.model.layers.1.post_attention_layernorm.weight', 'action_head.gemma.model.layers.2.self_attn.q_proj.weight', 'action_head.gemma.model.layers.2.self_attn.k_proj.weight', 'action_head.gemma.model.layers.2.self_attn.v_proj.weight', 'action_head.gemma.model.layers.2.self_attn.o_proj.weight', 'action_head.gemma.model.layers.2.mlp.gate_proj.weight', 'action_head.gemma.model.layers.2.mlp.up_proj.weight', 'action_head.gemma.model.layers.2.mlp.down_proj.weight', 'action_head.gemma.model.layers.2.input_layernorm.weight', 'action_head.gemma.model.layers.2.post_attention_layernorm.weight', 'action_head.gemma.model.layers.3.self_attn.q_proj.weight', 'action_head.gemma.model.layers.3.self_attn.k_proj.weight', 'action_head.gemma.model.layers.3.self_attn.v_proj.weight', 'action_head.gemma.model.layers.3.self_attn.o_proj.weight', 'action_head.gemma.model.layers.3.mlp.gate_proj.weight', 'action_head.gemma.model.layers.3.mlp.up_proj.weight', 'action_head.gemma.model.layers.3.mlp.down_proj.weight', 'action_head.gemma.model.layers.3.input_layernorm.weight', 'action_head.gemma.model.layers.3.post_attention_layernorm.weight', 'action_head.gemma.model.layers.4.self_attn.q_proj.weight', 'action_head.gemma.model.layers.4.self_attn.k_proj.weight', 'action_head.gemma.model.layers.4.self_attn.v_proj.weight', 'action_head.gemma.model.layers.4.self_attn.o_proj.weight', 'action_head.gemma.model.layers.4.mlp.gate_proj.weight', 'action_head.gemma.model.layers.4.mlp.up_proj.weight', 'action_head.gemma.model.layers.4.mlp.down_proj.weight', 'action_head.gemma.model.layers.4.input_layernorm.weight', 'action_head.gemma.model.layers.4.post_attention_layernorm.weight', 'action_head.gemma.model.layers.5.self_attn.q_proj.weight', 'action_head.gemma.model.layers.5.self_attn.k_proj.weight', 'action_head.gemma.model.layers.5.self_attn.v_proj.weight', 'action_head.gemma.model.layers.5.self_attn.o_proj.weight', 'action_head.gemma.model.layers.5.mlp.gate_proj.weight', 'action_head.gemma.model.layers.5.mlp.up_proj.weight', 'action_head.gemma.model.layers.5.mlp.down_proj.weight', 'action_head.gemma.model.layers.5.input_layernorm.weight', 'action_head.gemma.model.layers.5.post_attention_layernorm.weight', 'action_head.gemma.model.layers.6.self_attn.q_proj.weight', 'action_head.gemma.model.layers.6.self_attn.k_proj.weight', 'action_head.gemma.model.layers.6.self_attn.v_proj.weight', 'action_head.gemma.model.layers.6.self_attn.o_proj.weight', 'action_head.gemma.model.layers.6.mlp.gate_proj.weight', 'action_head.gemma.model.layers.6.mlp.up_proj.weight', 'action_head.gemma.model.layers.6.mlp.down_proj.weight', 'action_head.gemma.model.layers.6.input_layernorm.weight', 'action_head.gemma.model.layers.6.post_attention_
+unexpected keys: []
+************************* Initialize model successful!
+************************* LoRA flags: use_lora=True, lora_llm=False, lora_vit=False, lora_connector=False
+************************* Before add lora to model
+************************* Before FSDP model wrapping
+************************* FSDP model wrapping successful!
+************************* Before building optimizer and scheduler
+************* Before get lora params
+************* After get lora params successfully
+10/02 [16:30:16] INFO | >> Constructing optimizer with 2 param groups optim.py:1283
+**************************************************
+After building optimizer and scheduler and model, before training, peak GPU memory (MB): 36856
+************************* VLATrainer initialized successfully!
+************************* Before trainer.fit()
+Pre-train system metrics
+ System/Peak GPU Memory (MB)=36,856
+ WARNING | >> /vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py:200: UserWarning: To copy construct from a tensor, it is recommended to use warnings.py:109
+ sourceTensor.detach().clone() or sourceTensor.detach().clone().requires_grad_(True), rather than torch.tensor(sourceTensor).
+ timestep_list = [torch.tensor(ex["timestep"], dtype=torch.int64) for ex in batch]
+
+10/02 [16:30:23] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py:967: UserWarning: The .grad attribute warnings.py:109
+ of a Tensor that is not a leaf Tensor is being accessed. Its .grad attribute won't be populated during autograd.backward(). If you indeed
+ want the .grad field to be populated for a non-leaf Tensor, use .retain_grad() on the non-leaf Tensor. If you access the non-leaf Tensor
+ by mistake, make sure you access the leaf Tensor instead. See github.com/pytorch/pytorch/pull/30531 for more informations. (Triggered
+ internally at /pytorch/build/aten/src/ATen/core/TensorBody.h:489.)
+ param_grad = param.grad
+
+[step=1/500000]
+ train/ActionNoiseL2Loss=1.834
+ throughput/total_tokens=192,000
+ System/Peak GPU Memory (MB)=39,644
+[step=2/500000]
+ train/ActionNoiseL2Loss=1.807
+ throughput/total_tokens=384,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+ System/Peak GPU Memory (MB)=46,466
+[step=3/500000]
+ train/ActionNoiseL2Loss=1.699
+ throughput/total_tokens=576,000
+ throughput/device/tokens_per_second=975.1
+ throughput/device/batches_per_second=0.0406
+[step=4/500000]
+ train/ActionNoiseL2Loss=1.790
+ throughput/total_tokens=768,000
+ throughput/device/tokens_per_second=878.3
+ throughput/device/batches_per_second=0.0366
+[step=5/500000]
+ train/ActionNoiseL2Loss=1.693
+ throughput/total_tokens=960,000
+ throughput/device/tokens_per_second=830.7
+ throughput/device/batches_per_second=0.0346
+[step=6/500000]
+ train/ActionNoiseL2Loss=1.678
+ throughput/total_tokens=1,152,000
+ throughput/device/tokens_per_second=801.1
+ throughput/device/batches_per_second=0.0334
+[step=7/500000]
+ train/ActionNoiseL2Loss=1.561
+ throughput/total_tokens=1,344,000
+ throughput/device/tokens_per_second=779.7
+ throughput/device/batches_per_second=0.0325
diff --git a/glue/wandb/wandb/run-20251002_162842-zmotbaex/files/requirements.txt b/glue/wandb/wandb/run-20251002_162842-zmotbaex/files/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..5a5e971a5d9f3b6f6a75248e203682c5fbcd69e8
--- /dev/null
+++ b/glue/wandb/wandb/run-20251002_162842-zmotbaex/files/requirements.txt
@@ -0,0 +1,286 @@
+ai2-molmo==0.0.0
+astunparse==1.6.3
+flatbuffers==25.2.10
+gast==0.6.0
+google-pasta==0.2.0
+h5py==3.14.0
+libclang==18.1.1
+Markdown==3.9
+namex==0.1.0
+opt_einsum==3.4.0
+optree==0.17.0
+tensorboard-data-server==0.7.2
+tensorflow-io-gcs-filesystem==0.37.1
+termcolor==3.1.0
+Werkzeug==3.1.3
+Brotli==1.1.0
+Farama-Notifications==0.0.4
+MarkupSafe==2.1.5
+PyYAML==6.0.2
+absl-py==2.3.1
+accelerate==1.10.1
+ai2-molmo==0.0.0
+aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.15
+aiosignal==1.4.0
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+anyio==4.10.0
+array_record==0.8.1
+async-timeout==5.0.1
+attrs==25.3.0
+av==15.1.0
+backports.tarfile==1.2.0
+beaker-gantry==3.2.0
+beaker-py==2.5.0
+black==23.12.1
+blinker==1.9.0
+boltons==25.0.0
+boto3==1.40.33
+botocore==1.40.33
+build==1.3.0
+cached_path==1.7.3
+cached-property==2.0.1
+cachetools==5.5.2
+certifi==2025.8.3
+cffi==2.0.0
+charset-normalizer==3.4.3
+click==8.2.1
+click-help-colors==0.9.4
+click-option-group==0.5.7
+cloudpickle==3.1.1
+cmake==4.1.0
+contourpy==1.3.2
+cryptography==46.0.1
+cycler==0.12.1
+dataclass-extensions==0.2.3
+datasets==3.6.0
+decorator==5.2.1
+deepdiff==8.6.1
+diffusers==0.35.1
+dill==0.3.8
+distro==1.9.0
+dlimp==0.0.1
+dm-tree==0.1.9
+docutils==0.22.1
+draccus==0.10.0
+editdistance==0.8.1
+einops==0.8.1
+einops-exts==0.0.4
+et_xmlfile==2.0.0
+etils==1.13.0
+evdev==1.9.2
+exceptiongroup==1.3.0
+face==24.0.0
+fastapi==0.116.2
+ffmpy==0.6.1
+fiddle==0.3.0
+filelock==3.13.1
+Flask==3.1.2
+fonttools==4.60.0
+frozenlist==1.7.0
+fsspec==2023.9.2
+ftfy==6.3.1
+gcsfs==2023.9.2
+gitdb==4.0.12
+GitPython==3.1.45
+glom==24.11.0
+google-api-core==2.25.1
+google-auth==2.40.3
+google-auth-oauthlib==1.2.2
+google-cloud-core==2.4.3
+google-cloud-storage==2.19.0
+google-crc32c==1.7.1
+google-resumable-media==2.7.2
+googleapis-common-protos==1.70.0
+gradio==5.46.0
+gradio_client==1.13.0
+graphviz==0.21
+groovy==0.1.2
+grpcio==1.75.0
+gymnasium==0.29.1
+h11==0.16.0
+hf_transfer==0.1.9
+hf-xet==1.1.10
+httpcore==1.0.9
+httpx==0.28.1
+huggingface-hub==0.35.0
+id==1.5.0
+idna==3.10
+imageio==2.37.0
+imageio-ffmpeg==0.6.0
+importlib_metadata==8.7.0
+importlib_resources==6.5.2
+iniconfig==2.1.0
+inquirerpy==0.3.4
+isort==5.12.0
+itsdangerous==2.2.0
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.3.0
+jeepney==0.9.0
+Jinja2==3.1.4
+jiter==0.11.0
+jmespath==1.0.1
+joblib==1.5.2
+jsonlines==4.0.0
+keras==2.15.0
+keyring==25.6.0
+kiwisolver==1.4.9
+latex2sympy2_extended==1.10.2
+lerobot==0.3.4
+Levenshtein==0.27.1
+libcst==1.8.4
+lightning-utilities==0.15.2
+markdown-it-py==4.0.0
+math-verify==0.8.0
+matplotlib==3.10.6
+mdurl==0.1.2
+mergedeep==1.3.4
+ml-dtypes==0.2.0
+ml_dtypes==0.5.3
+more-itertools==10.8.0
+mpmath==1.3.0
+msgspec==0.19.0
+multidict==6.6.4
+multiprocess==0.70.16
+mypy==1.3.0
+mypy_extensions==1.1.0
+necessary==0.4.3
+networkx==3.3
+nh3==0.3.0
+nltk==3.9.1
+numpy==1.26.4
+oauthlib==3.3.1
+omegaconf==2.3.0
+openai==1.108.0
+opencv-python-headless==4.12.0.88
+OpenEXR==3.4.0
+openpyxl==3.1.5
+orderly-set==5.5.0
+orjson==3.11.3
+packaging==25.0
+pandas==2.3.2
+pathspec==0.12.1
+petname==2.6
+pfzy==0.3.4
+pillow==11.0.0
+pip==25.2
+platformdirs==4.4.0
+pluggy==1.6.0
+promise==2.3
+prompt_toolkit==3.0.52
+propcache==0.3.2
+proto-plus==1.26.1
+protobuf==4.21.12
+protobuf==6.32.1
+psutil==7.1.0
+pyarrow==21.0.0
+pyasn1==0.6.1
+pyasn1_modules==0.4.2
+pycparser==2.23
+pydantic==2.11.9
+pydantic_core==2.33.2
+pydub==0.25.1
+Pygments==2.19.2
+pynput==1.8.1
+pyparsing==3.2.4
+pyproject_hooks==1.2.0
+pyserial==3.5
+pytest==8.4.2
+pytest-sphinx==0.6.3
+python-dateutil==2.9.0.post0
+python-Levenshtein==0.27.1
+python-multipart==0.0.20
+python-xlib==0.33
+pytorch-triton-rocm==3.4.0
+pytz==2025.2
+pyyaml-include==1.4.1
+RapidFuzz==3.14.1
+readme_renderer==44.0
+regex==2025.9.1
+requests==2.32.5
+requests-oauthlib==2.0.0
+requests-toolbelt==1.0.0
+requirements-parser==0.13.0
+rerun-sdk==0.22.1
+rfc3986==2.0.0
+rich==13.9.4
+rsa==4.9.1
+ruff==0.13.0
+s3transfer==0.14.0
+safehttpx==0.1.6
+safetensors==0.6.2
+scikit-learn==1.7.2
+scipy==1.15.3
+SecretStorage==3.4.0
+semantic-version==2.10.0
+sentencepiece==0.2.1
+sentry-sdk==2.38.0
+setuptools==78.1.1
+shellingham==1.5.4
+six==1.17.0
+smart_open==7.3.1
+smashed==0.21.5
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.48.0
+sympy==1.13.3
+tensorboard==2.15.2
+tensorboard==2.19.0
+tensorflow==2.15.0
+tensorflow-addons==0.23.0
+tensorflow-datasets==4.9.3
+tensorflow-estimator==2.15.0
+tensorflow-graphics==2021.12.3
+tensorflow-metadata==1.17.2
+threadpoolctl==3.6.0
+timm==1.0.19
+tokenizers==0.22.0
+toml==0.10.2
+tomli==2.2.1
+tomlkit==0.13.3
+torch==2.8.0+rocm6.4
+torchcodec==0.5
+torchmetrics==1.8.2
+torchvision==0.23.0+rocm6.4
+tqdm==4.67.1
+transformers==4.56.1
+trimesh==4.8.2
+trouting==0.3.3
+twine==6.2.0
+typeguard==2.13.3
+typer==0.17.4
+typing_extensions==4.15.0
+typing-inspect==0.9.0
+typing-inspection==0.4.1
+tzdata==2025.2
+urllib3==2.5.0
+uvicorn==0.35.0
+wandb==0.21.4
+wcwidth==0.2.13
+websockets==15.0.1
+wheel==0.45.1
+wrapt==1.14.2
+xxhash==3.5.0
+yarl==1.20.1
+zipp==3.23.0
+lerobot==0.3.4
+minLoRA==0.1.0
+autocommand==2.2.2
+backports.tarfile==1.2.0
+importlib_metadata==8.0.0
+inflect==7.3.1
+jaraco.collections==5.1.0
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+more-itertools==10.3.0
+packaging==24.2
+platformdirs==4.2.2
+tomli==2.0.1
+typeguard==4.3.0
+typing_extensions==4.12.2
+wheel==0.45.1
+zipp==3.19.2
diff --git a/glue/wandb/wandb/run-20251002_162842-zmotbaex/files/wandb-metadata.json b/glue/wandb/wandb/run-20251002_162842-zmotbaex/files/wandb-metadata.json
new file mode 100644
index 0000000000000000000000000000000000000000..101facbbf972f6cc4d941234dc09772af888bdbe
--- /dev/null
+++ b/glue/wandb/wandb/run-20251002_162842-zmotbaex/files/wandb-metadata.json
@@ -0,0 +1,204 @@
+{
+ "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35",
+ "python": "CPython 3.10.18",
+ "startedAt": "2025-10-02T16:28:42.692996Z",
+ "args": [
+ "qwen2_7b",
+ "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/glue",
+ "--vision_backbone",
+ "openai",
+ "--action_head",
+ "flow_matching",
+ "--seq_len",
+ "1600",
+ "--ft_llm",
+ "--checkpoint",
+ "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924",
+ "--device_train_microbatch_size",
+ "16",
+ "--global_batch_size",
+ "126",
+ "--dataset",
+ "vla_dataset_realworld",
+ "--llm_learning_rate",
+ "5e-5",
+ "--wandb_entity",
+ "henryeap",
+ "--wandb_project",
+ "a1-realworld",
+ "--wandb_run_name",
+ "glue",
+ "--real_world_vla_config_path",
+ "vla_config_realworld/vla_config_glue.yaml",
+ "--save_overwrite"
+ ],
+ "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py",
+ "codePath": "launch_scripts/train_vla.py",
+ "codePathLocal": "launch_scripts/train_vla.py",
+ "git": {
+ "remote": "https://github.com/Spatialtemporal-AI/A1.git",
+ "commit": "5071f59d87c6a976691323cbac66d7a988b0b4e7"
+ },
+ "email": "ihenrykwok@outlook.com",
+ "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/glue/wandb",
+ "host": "auh7-1b-gpu-260",
+ "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "Instinct MI210",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "470343073792",
+ "used": "56243372032"
+ }
+ },
+ "memory": {
+ "total": "2434606956544"
+ },
+ "gpu_amd": [
+ {
+ "id": "6",
+ "uniqueId": "0x2d75dae36f0dc353",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "1",
+ "uniqueId": "0xe35cdba2e3fafd21",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "0",
+ "uniqueId": "0x4213cc9eeeefc98d",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "7",
+ "uniqueId": "0x702e8efb76b00c21",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "4",
+ "uniqueId": "0x4493708eee1ee737",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "2",
+ "uniqueId": "0x9815965a899d8053",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "3",
+ "uniqueId": "0xd7a6e11358a6574d",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "5",
+ "uniqueId": "0xd79d4a081e34548d",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ }
+ ],
+ "slurm": {
+ "cluster_name": "ai-04r",
+ "conf": "/etc/slurm/slurm.conf",
+ "cpus_on_node": "128",
+ "gpus_on_node": "8",
+ "gtids": "0",
+ "job_account": "faculty-acc",
+ "job_cpus_per_node": "128",
+ "job_end_time": "1759681678",
+ "job_gid": "2000",
+ "job_gpus": "0,1,2,3,4,5,6,7",
+ "job_id": "2259",
+ "job_name": "mh_glue_flow_matching",
+ "job_nodelist": "auh7-1b-gpu-260",
+ "job_num_nodes": "1",
+ "job_partition": "faculty",
+ "job_qos": "xdqos",
+ "job_start_time": "1759422478",
+ "job_uid": "2013",
+ "job_user": "xiaodan",
+ "jobid": "2259",
+ "localid": "0",
+ "nnodes": "1",
+ "nodeid": "0",
+ "nodelist": "auh7-1b-gpu-260",
+ "nprocs": "1",
+ "ntasks": "1",
+ "ntasks_per_node": "1",
+ "oom_kill_step": "0",
+ "prio_process": "0",
+ "procid": "0",
+ "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts",
+ "submit_host": "auh-1b-cpu-login-001",
+ "task_pid": "2571821",
+ "tasks_per_node": "1",
+ "topology_addr": "auh7-1b-gpu-260",
+ "topology_addr_pattern": "node"
+ },
+ "writerId": "mkb2blj4w2h2y7he4b0dlo7b5hd3p38x"
+}
\ No newline at end of file
diff --git a/glue/wandb/wandb/run-20251002_162842-zmotbaex/logs/debug-core.log b/glue/wandb/wandb/run-20251002_162842-zmotbaex/logs/debug-core.log
new file mode 100644
index 0000000000000000000000000000000000000000..fec31f7fb9916b6089ca3cc1a4986f779482f22d
--- /dev/null
+++ b/glue/wandb/wandb/run-20251002_162842-zmotbaex/logs/debug-core.log
@@ -0,0 +1,6 @@
+{"time":"2025-10-02T16:28:42.743912932Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpsh8i0z2c/port-2572010.txt","pid":2572010,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
+{"time":"2025-10-02T16:28:42.744707722Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":2572010}
+{"time":"2025-10-02T16:28:42.744690061Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-2572010-2572176-2097911213/socket","Net":"unix"}}
+{"time":"2025-10-02T16:28:42.92711156Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
+{"time":"2025-10-02T16:28:42.933538707Z","level":"INFO","msg":"handleInformInit: received","streamId":"zmotbaex","id":"1(@)"}
+{"time":"2025-10-02T16:28:43.973148537Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"zmotbaex","id":"1(@)"}
diff --git a/glue/wandb/wandb/run-20251002_162842-zmotbaex/logs/debug-internal.log b/glue/wandb/wandb/run-20251002_162842-zmotbaex/logs/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..b149f68c220a385066a78a83a8a465b361d70f08
--- /dev/null
+++ b/glue/wandb/wandb/run-20251002_162842-zmotbaex/logs/debug-internal.log
@@ -0,0 +1,6 @@
+{"time":"2025-10-02T16:28:42.93546825Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-10-02T16:28:43.973096137Z","level":"INFO","msg":"stream: created new stream","id":"zmotbaex"}
+{"time":"2025-10-02T16:28:43.973143067Z","level":"INFO","msg":"stream: started","id":"zmotbaex"}
+{"time":"2025-10-02T16:28:43.973152847Z","level":"INFO","msg":"writer: started","stream_id":"zmotbaex"}
+{"time":"2025-10-02T16:28:43.973166287Z","level":"INFO","msg":"sender: started","stream_id":"zmotbaex"}
+{"time":"2025-10-02T16:28:43.973210878Z","level":"INFO","msg":"handler: started","stream_id":"zmotbaex"}
diff --git a/glue/wandb/wandb/run-20251002_162842-zmotbaex/logs/debug.log b/glue/wandb/wandb/run-20251002_162842-zmotbaex/logs/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/glue/wandb/wandb/run-20251002_162842-zmotbaex/run-zmotbaex.wandb b/glue/wandb/wandb/run-20251002_162842-zmotbaex/run-zmotbaex.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..81074005a62d1192a19ab6a8204e4f10b833bb1c
Binary files /dev/null and b/glue/wandb/wandb/run-20251002_162842-zmotbaex/run-zmotbaex.wandb differ
diff --git a/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/files/output.log b/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/files/output.log
new file mode 100644
index 0000000000000000000000000000000000000000..90a7192d1c8b3002647fb7d5abbc4c644d3f4f84
--- /dev/null
+++ b/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/files/output.log
@@ -0,0 +1,107 @@
+wandb: Detected [openai] in use.
+wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
+wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
+10/02 [16:28:46] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Glue', 8, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 8, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 8, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}}
+****** Skip RLDS main; path not found: None
+****** start build LeRobot main...
+build_tokenizer, cache_dir None tokenizer_dir None
+10/02 [16:28:51] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:130
+ INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:435
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Glue
+****** length of the dataset: 10316
+****** Skip RLDS open-source-real-world; mixture 'a1_real_world' not found under: /vast/users/xiaodan/zhangjian/datasets/OXE
+****** Expect one of: []
+****** path: None
+****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None
+****** After build vla train dataset...
+****** iterable_sources: []
+****** Before build mixed iterable dataset...
+****** Build vla train dataloader successfully!
+************************* Build train_dataloader successful!
+************************* Before build_inf_evaluators
+10/02 [16:28:57] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+************************* Build evaluators successful!
+************************* Early exit flags: early_exit=False
+************************* Initialize model successful!
+***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt
+***** Load checkpoint successful!
+missing keys: ['action_head.model.layer_norm1.weight', 'action_head.model.layer_norm1.bias', 'action_head.model.fc1.weight', 'action_head.model.fc1.bias', 'action_head.model.mlp_resnet_blocks.0.ffn.0.weight', 'action_head.model.mlp_resnet_blocks.0.ffn.0.bias', 'action_head.model.mlp_resnet_blocks.0.ffn.1.weight', 'action_head.model.mlp_resnet_blocks.0.ffn.1.bias', 'action_head.model.mlp_resnet_blocks.1.ffn.0.weight', 'action_head.model.mlp_resnet_blocks.1.ffn.0.bias', 'action_head.model.mlp_resnet_blocks.1.ffn.1.weight', 'action_head.model.mlp_resnet_blocks.1.ffn.1.bias', 'action_head.model.layer_norm2.weight', 'action_head.model.layer_norm2.bias', 'action_head.model.fc2.weight', 'action_head.model.fc2.bias', 'proprio_projector.fc1.weight', 'proprio_projector.fc1.bias', 'proprio_projector.fc2.weight', 'proprio_projector.fc2.bias']
+unexpected keys: []
+************************* Initialize model successful!
+************************* LoRA flags: use_lora=True, lora_llm=False, lora_vit=False, lora_connector=False
+************************* Before add lora to model
+************************* Before FSDP model wrapping
+************************* FSDP model wrapping successful!
+************************* Before building optimizer and scheduler
+************* Before get lora params
+************* After get lora params successfully
+10/02 [16:30:26] INFO | >> Constructing optimizer with 2 param groups optim.py:1283
+**************************************************
+After building optimizer and scheduler and model, before training, peak GPU memory (MB): 35614
+************************* VLATrainer initialized successfully!
+************************* Before trainer.fit()
+Pre-train system metrics
+ System/Peak GPU Memory (MB)=35,614
+10/02 [16:30:27] WARNING | >> /vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py:200: UserWarning: To copy construct from a tensor, it is recommended to use warnings.py:109
+ sourceTensor.detach().clone() or sourceTensor.detach().clone().requires_grad_(True), rather than torch.tensor(sourceTensor).
+ timestep_list = [torch.tensor(ex["timestep"], dtype=torch.int64) for ex in batch]
+
+[step=1/500000]
+ train/ActionL1Loss=0.6604
+ throughput/total_tokens=192,000
+ System/Peak GPU Memory (MB)=40,144
+[step=2/500000]
+ train/ActionL1Loss=0.6686
+ throughput/total_tokens=384,000
+ throughput/device/tokens_per_second=1,212
+ throughput/device/batches_per_second=0.0505
+ System/Peak GPU Memory (MB)=46,917
+[step=3/500000]
+ train/ActionL1Loss=0.6331
+ throughput/total_tokens=576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4/500000]
+ train/ActionL1Loss=0.6222
+ throughput/total_tokens=768,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0491
+[step=5/500000]
+ train/ActionL1Loss=0.5780
+ throughput/total_tokens=960,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=6/500000]
+ train/ActionL1Loss=0.5804
+ throughput/total_tokens=1,152,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0490
+[step=7/500000]
+ train/ActionL1Loss=0.4998
+ throughput/total_tokens=1,344,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0490
+[step=8/500000]
+ train/ActionL1Loss=0.5153
+ throughput/total_tokens=1,536,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0491
+[step=9/500000]
+ train/ActionL1Loss=0.5447
+ throughput/total_tokens=1,728,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0491
+[step=10/500000]
+ train/ActionL1Loss=0.4229
+ throughput/total_tokens=1,920,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0491
+ System/Peak GPU Memory (MB)=46,917
diff --git a/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/files/requirements.txt b/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/files/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..5a5e971a5d9f3b6f6a75248e203682c5fbcd69e8
--- /dev/null
+++ b/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/files/requirements.txt
@@ -0,0 +1,286 @@
+ai2-molmo==0.0.0
+astunparse==1.6.3
+flatbuffers==25.2.10
+gast==0.6.0
+google-pasta==0.2.0
+h5py==3.14.0
+libclang==18.1.1
+Markdown==3.9
+namex==0.1.0
+opt_einsum==3.4.0
+optree==0.17.0
+tensorboard-data-server==0.7.2
+tensorflow-io-gcs-filesystem==0.37.1
+termcolor==3.1.0
+Werkzeug==3.1.3
+Brotli==1.1.0
+Farama-Notifications==0.0.4
+MarkupSafe==2.1.5
+PyYAML==6.0.2
+absl-py==2.3.1
+accelerate==1.10.1
+ai2-molmo==0.0.0
+aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.15
+aiosignal==1.4.0
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+anyio==4.10.0
+array_record==0.8.1
+async-timeout==5.0.1
+attrs==25.3.0
+av==15.1.0
+backports.tarfile==1.2.0
+beaker-gantry==3.2.0
+beaker-py==2.5.0
+black==23.12.1
+blinker==1.9.0
+boltons==25.0.0
+boto3==1.40.33
+botocore==1.40.33
+build==1.3.0
+cached_path==1.7.3
+cached-property==2.0.1
+cachetools==5.5.2
+certifi==2025.8.3
+cffi==2.0.0
+charset-normalizer==3.4.3
+click==8.2.1
+click-help-colors==0.9.4
+click-option-group==0.5.7
+cloudpickle==3.1.1
+cmake==4.1.0
+contourpy==1.3.2
+cryptography==46.0.1
+cycler==0.12.1
+dataclass-extensions==0.2.3
+datasets==3.6.0
+decorator==5.2.1
+deepdiff==8.6.1
+diffusers==0.35.1
+dill==0.3.8
+distro==1.9.0
+dlimp==0.0.1
+dm-tree==0.1.9
+docutils==0.22.1
+draccus==0.10.0
+editdistance==0.8.1
+einops==0.8.1
+einops-exts==0.0.4
+et_xmlfile==2.0.0
+etils==1.13.0
+evdev==1.9.2
+exceptiongroup==1.3.0
+face==24.0.0
+fastapi==0.116.2
+ffmpy==0.6.1
+fiddle==0.3.0
+filelock==3.13.1
+Flask==3.1.2
+fonttools==4.60.0
+frozenlist==1.7.0
+fsspec==2023.9.2
+ftfy==6.3.1
+gcsfs==2023.9.2
+gitdb==4.0.12
+GitPython==3.1.45
+glom==24.11.0
+google-api-core==2.25.1
+google-auth==2.40.3
+google-auth-oauthlib==1.2.2
+google-cloud-core==2.4.3
+google-cloud-storage==2.19.0
+google-crc32c==1.7.1
+google-resumable-media==2.7.2
+googleapis-common-protos==1.70.0
+gradio==5.46.0
+gradio_client==1.13.0
+graphviz==0.21
+groovy==0.1.2
+grpcio==1.75.0
+gymnasium==0.29.1
+h11==0.16.0
+hf_transfer==0.1.9
+hf-xet==1.1.10
+httpcore==1.0.9
+httpx==0.28.1
+huggingface-hub==0.35.0
+id==1.5.0
+idna==3.10
+imageio==2.37.0
+imageio-ffmpeg==0.6.0
+importlib_metadata==8.7.0
+importlib_resources==6.5.2
+iniconfig==2.1.0
+inquirerpy==0.3.4
+isort==5.12.0
+itsdangerous==2.2.0
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.3.0
+jeepney==0.9.0
+Jinja2==3.1.4
+jiter==0.11.0
+jmespath==1.0.1
+joblib==1.5.2
+jsonlines==4.0.0
+keras==2.15.0
+keyring==25.6.0
+kiwisolver==1.4.9
+latex2sympy2_extended==1.10.2
+lerobot==0.3.4
+Levenshtein==0.27.1
+libcst==1.8.4
+lightning-utilities==0.15.2
+markdown-it-py==4.0.0
+math-verify==0.8.0
+matplotlib==3.10.6
+mdurl==0.1.2
+mergedeep==1.3.4
+ml-dtypes==0.2.0
+ml_dtypes==0.5.3
+more-itertools==10.8.0
+mpmath==1.3.0
+msgspec==0.19.0
+multidict==6.6.4
+multiprocess==0.70.16
+mypy==1.3.0
+mypy_extensions==1.1.0
+necessary==0.4.3
+networkx==3.3
+nh3==0.3.0
+nltk==3.9.1
+numpy==1.26.4
+oauthlib==3.3.1
+omegaconf==2.3.0
+openai==1.108.0
+opencv-python-headless==4.12.0.88
+OpenEXR==3.4.0
+openpyxl==3.1.5
+orderly-set==5.5.0
+orjson==3.11.3
+packaging==25.0
+pandas==2.3.2
+pathspec==0.12.1
+petname==2.6
+pfzy==0.3.4
+pillow==11.0.0
+pip==25.2
+platformdirs==4.4.0
+pluggy==1.6.0
+promise==2.3
+prompt_toolkit==3.0.52
+propcache==0.3.2
+proto-plus==1.26.1
+protobuf==4.21.12
+protobuf==6.32.1
+psutil==7.1.0
+pyarrow==21.0.0
+pyasn1==0.6.1
+pyasn1_modules==0.4.2
+pycparser==2.23
+pydantic==2.11.9
+pydantic_core==2.33.2
+pydub==0.25.1
+Pygments==2.19.2
+pynput==1.8.1
+pyparsing==3.2.4
+pyproject_hooks==1.2.0
+pyserial==3.5
+pytest==8.4.2
+pytest-sphinx==0.6.3
+python-dateutil==2.9.0.post0
+python-Levenshtein==0.27.1
+python-multipart==0.0.20
+python-xlib==0.33
+pytorch-triton-rocm==3.4.0
+pytz==2025.2
+pyyaml-include==1.4.1
+RapidFuzz==3.14.1
+readme_renderer==44.0
+regex==2025.9.1
+requests==2.32.5
+requests-oauthlib==2.0.0
+requests-toolbelt==1.0.0
+requirements-parser==0.13.0
+rerun-sdk==0.22.1
+rfc3986==2.0.0
+rich==13.9.4
+rsa==4.9.1
+ruff==0.13.0
+s3transfer==0.14.0
+safehttpx==0.1.6
+safetensors==0.6.2
+scikit-learn==1.7.2
+scipy==1.15.3
+SecretStorage==3.4.0
+semantic-version==2.10.0
+sentencepiece==0.2.1
+sentry-sdk==2.38.0
+setuptools==78.1.1
+shellingham==1.5.4
+six==1.17.0
+smart_open==7.3.1
+smashed==0.21.5
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.48.0
+sympy==1.13.3
+tensorboard==2.15.2
+tensorboard==2.19.0
+tensorflow==2.15.0
+tensorflow-addons==0.23.0
+tensorflow-datasets==4.9.3
+tensorflow-estimator==2.15.0
+tensorflow-graphics==2021.12.3
+tensorflow-metadata==1.17.2
+threadpoolctl==3.6.0
+timm==1.0.19
+tokenizers==0.22.0
+toml==0.10.2
+tomli==2.2.1
+tomlkit==0.13.3
+torch==2.8.0+rocm6.4
+torchcodec==0.5
+torchmetrics==1.8.2
+torchvision==0.23.0+rocm6.4
+tqdm==4.67.1
+transformers==4.56.1
+trimesh==4.8.2
+trouting==0.3.3
+twine==6.2.0
+typeguard==2.13.3
+typer==0.17.4
+typing_extensions==4.15.0
+typing-inspect==0.9.0
+typing-inspection==0.4.1
+tzdata==2025.2
+urllib3==2.5.0
+uvicorn==0.35.0
+wandb==0.21.4
+wcwidth==0.2.13
+websockets==15.0.1
+wheel==0.45.1
+wrapt==1.14.2
+xxhash==3.5.0
+yarl==1.20.1
+zipp==3.23.0
+lerobot==0.3.4
+minLoRA==0.1.0
+autocommand==2.2.2
+backports.tarfile==1.2.0
+importlib_metadata==8.0.0
+inflect==7.3.1
+jaraco.collections==5.1.0
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+more-itertools==10.3.0
+packaging==24.2
+platformdirs==4.2.2
+tomli==2.0.1
+typeguard==4.3.0
+typing_extensions==4.12.2
+wheel==0.45.1
+zipp==3.19.2
diff --git a/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/files/wandb-metadata.json b/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/files/wandb-metadata.json
new file mode 100644
index 0000000000000000000000000000000000000000..7498577dcd257ab91ffbcc21d1e52bfe1a1cda6e
--- /dev/null
+++ b/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/files/wandb-metadata.json
@@ -0,0 +1,204 @@
+{
+ "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35",
+ "python": "CPython 3.10.18",
+ "startedAt": "2025-10-02T16:28:44.296863Z",
+ "args": [
+ "qwen2_7b",
+ "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/glue",
+ "--vision_backbone",
+ "openai",
+ "--action_head",
+ "l1_regression",
+ "--seq_len",
+ "1600",
+ "--ft_llm",
+ "--checkpoint",
+ "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924",
+ "--device_train_microbatch_size",
+ "16",
+ "--global_batch_size",
+ "126",
+ "--dataset",
+ "vla_dataset_realworld",
+ "--llm_learning_rate",
+ "5e-5",
+ "--wandb_entity",
+ "henryeap",
+ "--wandb_project",
+ "a1-realworld",
+ "--wandb_run_name",
+ "glue",
+ "--real_world_vla_config_path",
+ "vla_config_realworld/vla_config_glue.yaml",
+ "--save_overwrite"
+ ],
+ "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py",
+ "codePath": "launch_scripts/train_vla.py",
+ "codePathLocal": "launch_scripts/train_vla.py",
+ "git": {
+ "remote": "https://github.com/Spatialtemporal-AI/A1.git",
+ "commit": "5071f59d87c6a976691323cbac66d7a988b0b4e7"
+ },
+ "email": "ihenrykwok@outlook.com",
+ "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/glue/wandb",
+ "host": "auh7-1b-gpu-282",
+ "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "Instinct MI210",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "470343073792",
+ "used": "50534686720"
+ }
+ },
+ "memory": {
+ "total": "2434606956544"
+ },
+ "gpu_amd": [
+ {
+ "id": "1",
+ "uniqueId": "0x63f0fe2c43bc1640",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "2",
+ "uniqueId": "0x492f172b602a22b5",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "5",
+ "uniqueId": "0xcec181d5e2ce525",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "6",
+ "uniqueId": "0xdaf531ba129c665e",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "7",
+ "uniqueId": "0x14a7fc56ac2e5e42",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "3",
+ "uniqueId": "0x1af77dc455975108",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "4",
+ "uniqueId": "0xb66ccb62112b0571",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "0",
+ "uniqueId": "0x2e7a3afcefcaca4b",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ }
+ ],
+ "slurm": {
+ "cluster_name": "ai-04r",
+ "conf": "/etc/slurm/slurm.conf",
+ "cpus_on_node": "128",
+ "gpus_on_node": "8",
+ "gtids": "0",
+ "job_account": "faculty-acc",
+ "job_cpus_per_node": "128",
+ "job_end_time": "1759681678",
+ "job_gid": "2000",
+ "job_gpus": "0,1,2,3,4,5,6,7",
+ "job_id": "2260",
+ "job_name": "mh_glue_l1_regression",
+ "job_nodelist": "auh7-1b-gpu-282",
+ "job_num_nodes": "1",
+ "job_partition": "faculty",
+ "job_qos": "xdqos",
+ "job_start_time": "1759422478",
+ "job_uid": "2013",
+ "job_user": "xiaodan",
+ "jobid": "2260",
+ "localid": "0",
+ "nnodes": "1",
+ "nodeid": "0",
+ "nodelist": "auh7-1b-gpu-282",
+ "nprocs": "1",
+ "ntasks": "1",
+ "ntasks_per_node": "1",
+ "oom_kill_step": "0",
+ "prio_process": "0",
+ "procid": "0",
+ "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts",
+ "submit_host": "auh-1b-cpu-login-001",
+ "task_pid": "3777115",
+ "tasks_per_node": "1",
+ "topology_addr": "auh7-1b-gpu-282",
+ "topology_addr_pattern": "node"
+ },
+ "writerId": "065brkivq78b6pyeoha2ces6xhhdu5dv"
+}
\ No newline at end of file
diff --git a/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/logs/debug-core.log b/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/logs/debug-core.log
new file mode 100644
index 0000000000000000000000000000000000000000..2beae6d8861629a9a541fca159be5aeb6d90be82
--- /dev/null
+++ b/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/logs/debug-core.log
@@ -0,0 +1,6 @@
+{"time":"2025-10-02T16:28:44.546350644Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpduepwsd2/port-3777304.txt","pid":3777304,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
+{"time":"2025-10-02T16:28:44.547929797Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":3777304}
+{"time":"2025-10-02T16:28:44.549056273Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-3777304-3777474-3243164877/socket","Net":"unix"}}
+{"time":"2025-10-02T16:28:44.556761474Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
+{"time":"2025-10-02T16:28:44.572324418Z","level":"INFO","msg":"handleInformInit: received","streamId":"bzkyoc0w","id":"1(@)"}
+{"time":"2025-10-02T16:28:45.769139765Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"bzkyoc0w","id":"1(@)"}
diff --git a/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/logs/debug-internal.log b/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/logs/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..e42a40b41b0c9e340594ed1db9da0abd2fff3ae6
--- /dev/null
+++ b/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/logs/debug-internal.log
@@ -0,0 +1,6 @@
+{"time":"2025-10-02T16:28:44.574145675Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-10-02T16:28:45.769098374Z","level":"INFO","msg":"stream: created new stream","id":"bzkyoc0w"}
+{"time":"2025-10-02T16:28:45.769135025Z","level":"INFO","msg":"stream: started","id":"bzkyoc0w"}
+{"time":"2025-10-02T16:28:45.769167365Z","level":"INFO","msg":"handler: started","stream_id":"bzkyoc0w"}
+{"time":"2025-10-02T16:28:45.769158745Z","level":"INFO","msg":"writer: started","stream_id":"bzkyoc0w"}
+{"time":"2025-10-02T16:28:45.769191036Z","level":"INFO","msg":"sender: started","stream_id":"bzkyoc0w"}
diff --git a/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/logs/debug.log b/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/logs/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/run-bzkyoc0w.wandb b/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/run-bzkyoc0w.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..9f9e21929b1578aa70ee6fab478a23e0c3e2830e
Binary files /dev/null and b/glue/wandb/wandb/run-20251002_162844-bzkyoc0w/run-bzkyoc0w.wandb differ
diff --git a/glue_flow_matching/step12000-unsharded/config.yaml b/glue_flow_matching/step12000-unsharded/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..0eaf5277b17fc477766981dbd3ab42f911d71658
--- /dev/null
+++ b/glue_flow_matching/step12000-unsharded/config.yaml
@@ -0,0 +1,322 @@
+run_name: glue_20251002_163658
+seed: 6198
+epoch: null
+dry_run: false
+model:
+ d_model: 3584
+ n_heads: 28
+ n_kv_heads: 4
+ qkv_bias: true
+ clip_qkv: null
+ n_layers: 28
+ mlp_ratio: 4
+ mlp_hidden_size: 37888
+ activation_type: swiglu
+ block_type: sequential
+ block_group_size: 1
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1000000.0
+ vision_backbone:
+ image_model_type: openai
+ image_default_input_size:
+ - 336
+ - 336
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ image_emb_dim: 1024
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_head_dim: 64
+ image_mlp_dim: 4096
+ image_mlp_activations: quick_gelu
+ image_dropout_rate: 0.0
+ image_num_pos: 577
+ image_norm_eps: 1.0e-05
+ attention_dropout: 0.0
+ residual_dropout: 0.0
+ initializer_range: 0.02
+ fsdp_wrap: false
+ resize_mode: default
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ attention_type: sdpa
+ float32_attention: true
+ attention_dropout: 0.0
+ attention_layer_norm: false
+ residual_dropout: 0.1
+ response_residual_dropout: 0.0
+ embedding_dropout: 0.0
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ layer_norm_eps: 1.0e-06
+ attention_layer_norm_with_affine: true
+ max_sequence_length: 4096
+ max_position_embeddings: null
+ include_bias: false
+ bias_for_layer_norm: null
+ scale_logits: false
+ vocab_size: 152064
+ embedding_size: 152064
+ ff_out_size: null
+ additional_vocab_size: 128
+ new_embedding_init_range: 0.02
+ weight_tying: false
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ init_cutoff_factor: null
+ norm_after: false
+ precision: amp_bf16
+ max_crops: 12
+ crop_mode: overlap-and-resize-c2
+ use_col_tokens: true
+ prompt_type: uber_model
+ system_prompt_kind: demo_or_style
+ message_formatting: role
+ always_start_with_space: true
+ multi_annotation_weighting: root_subsegments
+ default_inference_len: 65
+ overlap_margins:
+ - 4
+ - 4
+ pad_value: 0.0
+ image_padding_embed: pad_and_partial_pad
+ fix_image_padding: true
+ vit_layers:
+ - -2
+ - -9
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_pooling_2d: attention_meanq
+ image_projector: mlp
+ image_feature_dropout: 0.0
+ initializer_range: 0.02
+ normalize_input_embeds: false
+ use_position_ids: true
+ head_dim: null
+ action_tokenizer:
+ identifier: physical-intelligence/fast
+ tokenizer_dir: null
+ action_dim: 7
+ horizon: 8
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ pad_tokenizer: true
+ moe_num_experts: 8
+ moe_top_k: 2
+ moe_mlp_impl: sparse
+ moe_log_expert_assignment: false
+ moe_shared_expert: false
+ moe_lbl_in_fp32: false
+ moe_interleave: false
+ moe_loss_weight: 0.1
+ moe_zloss_weight: null
+ moe_dropless: true
+ moe_capacity_factor: 1.25
+ action_head: flow_matching
+ num_diffusion_steps: 1000
+ num_diffusion_inference_steps: 30
+ use_proprio: true
+ action_head_dit_hidden_size: 1152
+ action_head_dit_depth: 28
+ action_head_dit_num_heads: 16
+ llm_causal_attention: false
+ action_use_left_eef: true
+ action_use_mobile_base: false
+allow_resume: false
+ft_llm: true
+ft_vit: false
+ft_connector: false
+ft_embedding: lm_head
+lora: false
+use_lora: true
+lora_rank: 8
+lora_llm: false
+lora_vit: false
+lora_connector: false
+early_exit: false
+train_exit_random_layer: false
+optimizer:
+ name: adamw
+ learning_rate: 0.0001
+ weight_decay: 0.01
+ betas:
+ - 0.9
+ - 0.95
+ eps: 1.0e-05
+ connector_learning_rate: 0.0002
+ vit_learning_rate: 6.0e-06
+ llm_learning_rate: 5.0e-05
+ connector_weight_decay: 0.0
+ vit_weight_decay: 0.0
+ llm_weight_decay: 0.0
+ connector_betas:
+ - 0.9
+ - 0.95
+ vit_betas:
+ - 0.9
+ - 0.95
+ llm_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1.0e-06
+ vit_eps: 1.0e-06
+ llm_eps: 1.0e-06
+ metrics_log_interval: 20
+scheduler:
+ name: multimodal
+ units: steps
+ t_warmup: 100
+ t_max: null
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ vit_t_warmup: 2000
+ llm_t_warmup: 2000
+ grad_clip_warmup_steps: null
+ grad_clip_warmup_factor: null
+ warmup_min_lr: 0.0
+data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: train
+ seed: 95818
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: true
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: false
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Glue
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: null
+ lerobot_episode_index_end: null
+restore_dataloader: true
+fast_forward_batches: null
+evaluators:
+- label: val
+ data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: validation
+ seed: null
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: false
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: true
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: 353
+ lerobot_episode_index_end: 765
+ device_eval_batch_size: null
+ subset_num_batches: 64
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ eval_name: null
+ skip_if_metrics_cached: true
+eval_interval: 0
+inf_eval_interval: -1
+inf_evaluators: []
+save_folder: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/glue_flow_matching
+remote_save_folder: null
+canceled_check_interval: 50
+save_interval: 500
+save_interval_unsharded: 500
+save_interval_ephemeral: null
+save_interval_action_head: 500
+save_num_checkpoints_to_keep: 1
+save_num_unsharded_checkpoints_to_keep: 1
+save_num_action_head_checkpoints_to_keep: 2
+save_overwrite: true
+force_save_unsharded: false
+no_pre_train_checkpoint: true
+initial_model_checkpoint: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_model_config: null
+checkpoint_dir: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_path: null
+load_path_sharded_checkpointer: null
+reset_optimizer_state: false
+reset_trainer_state: false
+save_dataloader_state: false
+reset_dataloader_state: false
+keep_lr_on_load: true
+sharded_checkpointer: torch_legacy
+max_duration: 500000
+global_train_batch_size: 126
+device_train_batch_size: 15
+device_train_microbatch_size: 16
+device_eval_batch_size: 4
+eval_subset_num_batches: -1
+eval_on_load: false
+device_inf_eval_batch_size: 16
+inf_eval_subset_num_batches: -1
+device_train_grad_accum: 0
+max_grad_norm: 1.0
+multi_component_grad_norm: true
+batch_divisor: global_batch
+max_grad_norm_ratio: null
+precision: amp_bf16
+wandb:
+ project: a1-realworld
+ entity: henryeap
+ group: null
+ name: glue_20251002_163658
+ tags:
+ - watching
+ log_artifacts: false
+ rank_zero_only: true
+ log_interval: 1
+speed_monitor:
+ window_size: 20
+ gpu_flops_available: null
+console_log_interval: 1
+gen1_gc_interval: 1
+compile: null
+fsdp:
+ use_orig_params: true
+ sharding_strategy: FULL_SHARD
+ wrapping_strategy: by_block_and_size
+ precision: float
+ hybrid_sharding_num_model_replicas: null
+softmax_auxiliary_loss: true
+softmax_auxiliary_loss_scale: 0.0001
+time_limit: null
+extra_steps_after_cancel: 10
+python_profiling: false
+torch_profiling: false
+stop_at: 500000
+stop_after: null
+activation_checkpointing: whole_layer
+fused_loss: null
diff --git a/glue_flow_matching/step12000/config.yaml b/glue_flow_matching/step12000/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..0eaf5277b17fc477766981dbd3ab42f911d71658
--- /dev/null
+++ b/glue_flow_matching/step12000/config.yaml
@@ -0,0 +1,322 @@
+run_name: glue_20251002_163658
+seed: 6198
+epoch: null
+dry_run: false
+model:
+ d_model: 3584
+ n_heads: 28
+ n_kv_heads: 4
+ qkv_bias: true
+ clip_qkv: null
+ n_layers: 28
+ mlp_ratio: 4
+ mlp_hidden_size: 37888
+ activation_type: swiglu
+ block_type: sequential
+ block_group_size: 1
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1000000.0
+ vision_backbone:
+ image_model_type: openai
+ image_default_input_size:
+ - 336
+ - 336
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ image_emb_dim: 1024
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_head_dim: 64
+ image_mlp_dim: 4096
+ image_mlp_activations: quick_gelu
+ image_dropout_rate: 0.0
+ image_num_pos: 577
+ image_norm_eps: 1.0e-05
+ attention_dropout: 0.0
+ residual_dropout: 0.0
+ initializer_range: 0.02
+ fsdp_wrap: false
+ resize_mode: default
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ attention_type: sdpa
+ float32_attention: true
+ attention_dropout: 0.0
+ attention_layer_norm: false
+ residual_dropout: 0.1
+ response_residual_dropout: 0.0
+ embedding_dropout: 0.0
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ layer_norm_eps: 1.0e-06
+ attention_layer_norm_with_affine: true
+ max_sequence_length: 4096
+ max_position_embeddings: null
+ include_bias: false
+ bias_for_layer_norm: null
+ scale_logits: false
+ vocab_size: 152064
+ embedding_size: 152064
+ ff_out_size: null
+ additional_vocab_size: 128
+ new_embedding_init_range: 0.02
+ weight_tying: false
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ init_cutoff_factor: null
+ norm_after: false
+ precision: amp_bf16
+ max_crops: 12
+ crop_mode: overlap-and-resize-c2
+ use_col_tokens: true
+ prompt_type: uber_model
+ system_prompt_kind: demo_or_style
+ message_formatting: role
+ always_start_with_space: true
+ multi_annotation_weighting: root_subsegments
+ default_inference_len: 65
+ overlap_margins:
+ - 4
+ - 4
+ pad_value: 0.0
+ image_padding_embed: pad_and_partial_pad
+ fix_image_padding: true
+ vit_layers:
+ - -2
+ - -9
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_pooling_2d: attention_meanq
+ image_projector: mlp
+ image_feature_dropout: 0.0
+ initializer_range: 0.02
+ normalize_input_embeds: false
+ use_position_ids: true
+ head_dim: null
+ action_tokenizer:
+ identifier: physical-intelligence/fast
+ tokenizer_dir: null
+ action_dim: 7
+ horizon: 8
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ pad_tokenizer: true
+ moe_num_experts: 8
+ moe_top_k: 2
+ moe_mlp_impl: sparse
+ moe_log_expert_assignment: false
+ moe_shared_expert: false
+ moe_lbl_in_fp32: false
+ moe_interleave: false
+ moe_loss_weight: 0.1
+ moe_zloss_weight: null
+ moe_dropless: true
+ moe_capacity_factor: 1.25
+ action_head: flow_matching
+ num_diffusion_steps: 1000
+ num_diffusion_inference_steps: 30
+ use_proprio: true
+ action_head_dit_hidden_size: 1152
+ action_head_dit_depth: 28
+ action_head_dit_num_heads: 16
+ llm_causal_attention: false
+ action_use_left_eef: true
+ action_use_mobile_base: false
+allow_resume: false
+ft_llm: true
+ft_vit: false
+ft_connector: false
+ft_embedding: lm_head
+lora: false
+use_lora: true
+lora_rank: 8
+lora_llm: false
+lora_vit: false
+lora_connector: false
+early_exit: false
+train_exit_random_layer: false
+optimizer:
+ name: adamw
+ learning_rate: 0.0001
+ weight_decay: 0.01
+ betas:
+ - 0.9
+ - 0.95
+ eps: 1.0e-05
+ connector_learning_rate: 0.0002
+ vit_learning_rate: 6.0e-06
+ llm_learning_rate: 5.0e-05
+ connector_weight_decay: 0.0
+ vit_weight_decay: 0.0
+ llm_weight_decay: 0.0
+ connector_betas:
+ - 0.9
+ - 0.95
+ vit_betas:
+ - 0.9
+ - 0.95
+ llm_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1.0e-06
+ vit_eps: 1.0e-06
+ llm_eps: 1.0e-06
+ metrics_log_interval: 20
+scheduler:
+ name: multimodal
+ units: steps
+ t_warmup: 100
+ t_max: null
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ vit_t_warmup: 2000
+ llm_t_warmup: 2000
+ grad_clip_warmup_steps: null
+ grad_clip_warmup_factor: null
+ warmup_min_lr: 0.0
+data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: train
+ seed: 95818
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: true
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: false
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Glue
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: null
+ lerobot_episode_index_end: null
+restore_dataloader: true
+fast_forward_batches: null
+evaluators:
+- label: val
+ data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: validation
+ seed: null
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: false
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: true
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: 353
+ lerobot_episode_index_end: 765
+ device_eval_batch_size: null
+ subset_num_batches: 64
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ eval_name: null
+ skip_if_metrics_cached: true
+eval_interval: 0
+inf_eval_interval: -1
+inf_evaluators: []
+save_folder: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/glue_flow_matching
+remote_save_folder: null
+canceled_check_interval: 50
+save_interval: 500
+save_interval_unsharded: 500
+save_interval_ephemeral: null
+save_interval_action_head: 500
+save_num_checkpoints_to_keep: 1
+save_num_unsharded_checkpoints_to_keep: 1
+save_num_action_head_checkpoints_to_keep: 2
+save_overwrite: true
+force_save_unsharded: false
+no_pre_train_checkpoint: true
+initial_model_checkpoint: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_model_config: null
+checkpoint_dir: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_path: null
+load_path_sharded_checkpointer: null
+reset_optimizer_state: false
+reset_trainer_state: false
+save_dataloader_state: false
+reset_dataloader_state: false
+keep_lr_on_load: true
+sharded_checkpointer: torch_legacy
+max_duration: 500000
+global_train_batch_size: 126
+device_train_batch_size: 15
+device_train_microbatch_size: 16
+device_eval_batch_size: 4
+eval_subset_num_batches: -1
+eval_on_load: false
+device_inf_eval_batch_size: 16
+inf_eval_subset_num_batches: -1
+device_train_grad_accum: 0
+max_grad_norm: 1.0
+multi_component_grad_norm: true
+batch_divisor: global_batch
+max_grad_norm_ratio: null
+precision: amp_bf16
+wandb:
+ project: a1-realworld
+ entity: henryeap
+ group: null
+ name: glue_20251002_163658
+ tags:
+ - watching
+ log_artifacts: false
+ rank_zero_only: true
+ log_interval: 1
+speed_monitor:
+ window_size: 20
+ gpu_flops_available: null
+console_log_interval: 1
+gen1_gc_interval: 1
+compile: null
+fsdp:
+ use_orig_params: true
+ sharding_strategy: FULL_SHARD
+ wrapping_strategy: by_block_and_size
+ precision: float
+ hybrid_sharding_num_model_replicas: null
+softmax_auxiliary_loss: true
+softmax_auxiliary_loss_scale: 0.0001
+time_limit: null
+extra_steps_after_cancel: 10
+python_profiling: false
+torch_profiling: false
+stop_at: 500000
+stop_after: null
+activation_checkpointing: whole_layer
+fused_loss: null
diff --git a/glue_flow_matching/wandb/wandb/debug-internal.log b/glue_flow_matching/wandb/wandb/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..b6f233979d8d54643d262152a9e875cadf5086d3
--- /dev/null
+++ b/glue_flow_matching/wandb/wandb/debug-internal.log
@@ -0,0 +1,6 @@
+{"time":"2025-10-02T16:37:29.207693207Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-10-02T16:37:30.340213302Z","level":"INFO","msg":"stream: created new stream","id":"tmwli25x"}
+{"time":"2025-10-02T16:37:30.340254592Z","level":"INFO","msg":"stream: started","id":"tmwli25x"}
+{"time":"2025-10-02T16:37:30.340274553Z","level":"INFO","msg":"writer: started","stream_id":"tmwli25x"}
+{"time":"2025-10-02T16:37:30.340287593Z","level":"INFO","msg":"handler: started","stream_id":"tmwli25x"}
+{"time":"2025-10-02T16:37:30.340319673Z","level":"INFO","msg":"sender: started","stream_id":"tmwli25x"}
diff --git a/glue_flow_matching/wandb/wandb/debug.log b/glue_flow_matching/wandb/wandb/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/files/output.log b/glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/files/output.log
new file mode 100644
index 0000000000000000000000000000000000000000..451bbadc6d97edd88acc404b51c4448680f52631
--- /dev/null
+++ b/glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/files/output.log
@@ -0,0 +1,62686 @@
+wandb: Detected [openai] in use.
+wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
+wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
+10/02 [16:37:31] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Glue', 8, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 8, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 8, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}}
+****** Skip RLDS main; path not found: None
+****** start build LeRobot main...
+build_tokenizer, cache_dir None tokenizer_dir None
+10/02 [16:37:42] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:130
+10/02 [16:37:43] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:435
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Glue
+****** length of the dataset: 10316
+****** Skip RLDS open-source-real-world; mixture 'a1_real_world' not found under: /vast/users/xiaodan/zhangjian/datasets/OXE
+****** Expect one of: []
+****** path: None
+****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None
+****** After build vla train dataset...
+****** iterable_sources: []
+****** Before build mixed iterable dataset...
+****** Build vla train dataloader successfully!
+************************* Build train_dataloader successful!
+************************* Before build_inf_evaluators
+10/02 [16:37:49] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+************************* Build evaluators successful!
+************************* Early exit flags: early_exit=False
+************************* Initialize model successful!
+***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt
+***** Load checkpoint successful!
+missing keys: ['action_head.state_proj.weight', 'action_head.state_proj.bias', 'action_head.action_in_proj.weight', 'action_head.action_in_proj.bias', 'action_head.action_time_in.weight', 'action_head.action_time_in.bias', 'action_head.action_time_out.weight', 'action_head.action_time_out.bias', 'action_head.memory_proj.weight', 'action_head.memory_proj.bias', 'action_head.gemma.model.layers.0.self_attn.q_proj.weight', 'action_head.gemma.model.layers.0.self_attn.k_proj.weight', 'action_head.gemma.model.layers.0.self_attn.v_proj.weight', 'action_head.gemma.model.layers.0.self_attn.o_proj.weight', 'action_head.gemma.model.layers.0.mlp.gate_proj.weight', 'action_head.gemma.model.layers.0.mlp.up_proj.weight', 'action_head.gemma.model.layers.0.mlp.down_proj.weight', 'action_head.gemma.model.layers.0.input_layernorm.weight', 'action_head.gemma.model.layers.0.post_attention_layernorm.weight', 'action_head.gemma.model.layers.1.self_attn.q_proj.weight', 'action_head.gemma.model.layers.1.self_attn.k_proj.weight', 'action_head.gemma.model.layers.1.self_attn.v_proj.weight', 'action_head.gemma.model.layers.1.self_attn.o_proj.weight', 'action_head.gemma.model.layers.1.mlp.gate_proj.weight', 'action_head.gemma.model.layers.1.mlp.up_proj.weight', 'action_head.gemma.model.layers.1.mlp.down_proj.weight', 'action_head.gemma.model.layers.1.input_layernorm.weight', 'action_head.gemma.model.layers.1.post_attention_layernorm.weight', 'action_head.gemma.model.layers.2.self_attn.q_proj.weight', 'action_head.gemma.model.layers.2.self_attn.k_proj.weight', 'action_head.gemma.model.layers.2.self_attn.v_proj.weight', 'action_head.gemma.model.layers.2.self_attn.o_proj.weight', 'action_head.gemma.model.layers.2.mlp.gate_proj.weight', 'action_head.gemma.model.layers.2.mlp.up_proj.weight', 'action_head.gemma.model.layers.2.mlp.down_proj.weight', 'action_head.gemma.model.layers.2.input_layernorm.weight', 'action_head.gemma.model.layers.2.post_attention_layernorm.weight', 'action_head.gemma.model.layers.3.self_attn.q_proj.weight', 'action_head.gemma.model.layers.3.self_attn.k_proj.weight', 'action_head.gemma.model.layers.3.self_attn.v_proj.weight', 'action_head.gemma.model.layers.3.self_attn.o_proj.weight', 'action_head.gemma.model.layers.3.mlp.gate_proj.weight', 'action_head.gemma.model.layers.3.mlp.up_proj.weight', 'action_head.gemma.model.layers.3.mlp.down_proj.weight', 'action_head.gemma.model.layers.3.input_layernorm.weight', 'action_head.gemma.model.layers.3.post_attention_layernorm.weight', 'action_head.gemma.model.layers.4.self_attn.q_proj.weight', 'action_head.gemma.model.layers.4.self_attn.k_proj.weight', 'action_head.gemma.model.layers.4.self_attn.v_proj.weight', 'action_head.gemma.model.layers.4.self_attn.o_proj.weight', 'action_head.gemma.model.layers.4.mlp.gate_proj.weight', 'action_head.gemma.model.layers.4.mlp.up_proj.weight', 'action_head.gemma.model.layers.4.mlp.down_proj.weight', 'action_head.gemma.model.layers.4.input_layernorm.weight', 'action_head.gemma.model.layers.4.post_attention_layernorm.weight', 'action_head.gemma.model.layers.5.self_attn.q_proj.weight', 'action_head.gemma.model.layers.5.self_attn.k_proj.weight', 'action_head.gemma.model.layers.5.self_attn.v_proj.weight', 'action_head.gemma.model.layers.5.self_attn.o_proj.weight', 'action_head.gemma.model.layers.5.mlp.gate_proj.weight', 'action_head.gemma.model.layers.5.mlp.up_proj.weight', 'action_head.gemma.model.layers.5.mlp.down_proj.weight', 'action_head.gemma.model.layers.5.input_layernorm.weight', 'action_head.gemma.model.layers.5.post_attention_layernorm.weight', 'action_head.gemma.model.layers.6.self_attn.q_proj.weight', 'action_head.gemma.model.layers.6.self_attn.k_proj.weight', 'action_head.gemma.model.layers.6.self_attn.v_proj.weight', 'action_head.gemma.model.layers.6.self_attn.o_proj.weight', 'action_head.gemma.model.layers.6.mlp.gate_proj.weight', 'action_head.gemma.model.layers.6.mlp.up_proj.weight', 'action_head.gemma.model.layers.6.mlp.down_proj.weight', 'action_head.gemma.model.layers.6.input_layernorm.weight', 'action_head.gemma.model.layers.6.post_attention_
+unexpected keys: []
+************************* Initialize model successful!
+************************* LoRA flags: use_lora=True, lora_llm=False, lora_vit=False, lora_connector=False
+************************* Before add lora to model
+************************* Before FSDP model wrapping
+************************* FSDP model wrapping successful!
+************************* Before building optimizer and scheduler
+************* Before get lora params
+************* After get lora params successfully
+10/02 [16:39:07] INFO | >> Constructing optimizer with 2 param groups optim.py:1283
+**************************************************
+After building optimizer and scheduler and model, before training, peak GPU memory (MB): 36856
+************************* VLATrainer initialized successfully!
+************************* Before trainer.fit()
+Pre-train system metrics
+ System/Peak GPU Memory (MB)=36,856
+10/02 [16:39:08] WARNING | >> /vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py:200: UserWarning: To copy construct from a tensor, it is recommended to use warnings.py:109
+ sourceTensor.detach().clone() or sourceTensor.detach().clone().requires_grad_(True), rather than torch.tensor(sourceTensor).
+ timestep_list = [torch.tensor(ex["timestep"], dtype=torch.int64) for ex in batch]
+
+10/02 [16:39:15] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py:967: UserWarning: The .grad attribute warnings.py:109
+ of a Tensor that is not a leaf Tensor is being accessed. Its .grad attribute won't be populated during autograd.backward(). If you indeed
+ want the .grad field to be populated for a non-leaf Tensor, use .retain_grad() on the non-leaf Tensor. If you access the non-leaf Tensor
+ by mistake, make sure you access the leaf Tensor instead. See github.com/pytorch/pytorch/pull/30531 for more informations. (Triggered
+ internally at /pytorch/build/aten/src/ATen/core/TensorBody.h:489.)
+ param_grad = param.grad
+
+[step=1/500000]
+ train/ActionNoiseL2Loss=1.834
+ throughput/total_tokens=192,000
+ System/Peak GPU Memory (MB)=39,644
+[step=2/500000]
+ train/ActionNoiseL2Loss=1.807
+ throughput/total_tokens=384,000
+ throughput/device/tokens_per_second=1,196
+ throughput/device/batches_per_second=0.0499
+ System/Peak GPU Memory (MB)=46,466
+[step=3/500000]
+ train/ActionNoiseL2Loss=1.699
+ throughput/total_tokens=576,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=4/500000]
+ train/ActionNoiseL2Loss=1.790
+ throughput/total_tokens=768,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=5/500000]
+ train/ActionNoiseL2Loss=1.693
+ throughput/total_tokens=960,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=6/500000]
+ train/ActionNoiseL2Loss=1.678
+ throughput/total_tokens=1,152,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=7/500000]
+ train/ActionNoiseL2Loss=1.561
+ throughput/total_tokens=1,344,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=8/500000]
+ train/ActionNoiseL2Loss=1.604
+ throughput/total_tokens=1,536,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=9/500000]
+ train/ActionNoiseL2Loss=1.556
+ throughput/total_tokens=1,728,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=10/500000]
+ train/ActionNoiseL2Loss=1.506
+ throughput/total_tokens=1,920,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+ System/Peak GPU Memory (MB)=46,466
+[step=11/500000]
+ train/ActionNoiseL2Loss=1.537
+ throughput/total_tokens=2,112,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=12/500000]
+ train/ActionNoiseL2Loss=1.279
+ throughput/total_tokens=2,304,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=13/500000]
+ train/ActionNoiseL2Loss=1.478
+ throughput/total_tokens=2,496,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=14/500000]
+ train/ActionNoiseL2Loss=1.433
+ throughput/total_tokens=2,688,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=15/500000]
+ train/ActionNoiseL2Loss=1.288
+ throughput/total_tokens=2,880,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=16/500000]
+ train/ActionNoiseL2Loss=1.371
+ throughput/total_tokens=3,072,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=17/500000]
+ train/ActionNoiseL2Loss=1.353
+ throughput/total_tokens=3,264,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=18/500000]
+ train/ActionNoiseL2Loss=1.520
+ throughput/total_tokens=3,456,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=19/500000]
+ train/ActionNoiseL2Loss=1.306
+ throughput/total_tokens=3,648,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=20/500000]
+ optim/total_grad_norm=16.40
+ train/ActionNoiseL2Loss=1.323
+ throughput/total_tokens=3,840,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+ System/Peak GPU Memory (MB)=46,466
+[step=21/500000]
+ train/ActionNoiseL2Loss=1.404
+ throughput/total_tokens=4,032,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=22/500000]
+ train/ActionNoiseL2Loss=1.267
+ throughput/total_tokens=4,224,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=23/500000]
+ train/ActionNoiseL2Loss=1.393
+ throughput/total_tokens=4,416,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=24/500000]
+ train/ActionNoiseL2Loss=1.258
+ throughput/total_tokens=4,608,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=25/500000]
+ train/ActionNoiseL2Loss=1.194
+ throughput/total_tokens=4,800,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=26/500000]
+ train/ActionNoiseL2Loss=1.319
+ throughput/total_tokens=4,992,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=27/500000]
+ train/ActionNoiseL2Loss=1.215
+ throughput/total_tokens=5,184,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=28/500000]
+ train/ActionNoiseL2Loss=1.260
+ throughput/total_tokens=5,376,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=29/500000]
+ train/ActionNoiseL2Loss=1.131
+ throughput/total_tokens=5,568,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=30/500000]
+ train/ActionNoiseL2Loss=1.240
+ throughput/total_tokens=5,760,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,466
+[step=31/500000]
+ train/ActionNoiseL2Loss=1.086
+ throughput/total_tokens=5,952,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=32/500000]
+ train/ActionNoiseL2Loss=1.050
+ throughput/total_tokens=6,144,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=33/500000]
+ train/ActionNoiseL2Loss=1.266
+ throughput/total_tokens=6,336,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=34/500000]
+ train/ActionNoiseL2Loss=1.018
+ throughput/total_tokens=6,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=35/500000]
+ train/ActionNoiseL2Loss=1.007
+ throughput/total_tokens=6,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=36/500000]
+ train/ActionNoiseL2Loss=1.102
+ throughput/total_tokens=6,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=37/500000]
+ train/ActionNoiseL2Loss=1.091
+ throughput/total_tokens=7,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=38/500000]
+ train/ActionNoiseL2Loss=1.148
+ throughput/total_tokens=7,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=39/500000]
+ train/ActionNoiseL2Loss=0.9434
+ throughput/total_tokens=7,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=40/500000]
+ optim/total_grad_norm=13.83
+ train/ActionNoiseL2Loss=1.082
+ throughput/total_tokens=7,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,466
+[step=41/500000]
+ train/ActionNoiseL2Loss=0.8982
+ throughput/total_tokens=7,872,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=42/500000]
+ train/ActionNoiseL2Loss=1.019
+ throughput/total_tokens=8,064,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=43/500000]
+ train/ActionNoiseL2Loss=0.9823
+ throughput/total_tokens=8,256,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=44/500000]
+ train/ActionNoiseL2Loss=1.175
+ throughput/total_tokens=8,448,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=45/500000]
+ train/ActionNoiseL2Loss=1.020
+ throughput/total_tokens=8,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=46/500000]
+ train/ActionNoiseL2Loss=0.9180
+ throughput/total_tokens=8,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=47/500000]
+ train/ActionNoiseL2Loss=0.9789
+ throughput/total_tokens=9,024,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=48/500000]
+ train/ActionNoiseL2Loss=0.9764
+ throughput/total_tokens=9,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=49/500000]
+ train/ActionNoiseL2Loss=0.9196
+ throughput/total_tokens=9,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=50/500000]
+ train/ActionNoiseL2Loss=0.9288
+ throughput/total_tokens=9,600,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,466
+[step=51/500000]
+ train/ActionNoiseL2Loss=0.7798
+ throughput/total_tokens=9,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=52/500000]
+ train/ActionNoiseL2Loss=0.8925
+ throughput/total_tokens=9,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=53/500000]
+ train/ActionNoiseL2Loss=0.9779
+ throughput/total_tokens=10,176,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=54/500000]
+ train/ActionNoiseL2Loss=0.8652
+ throughput/total_tokens=10,368,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=55/500000]
+ train/ActionNoiseL2Loss=0.8910
+ throughput/total_tokens=10,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=56/500000]
+ train/ActionNoiseL2Loss=0.9522
+ throughput/total_tokens=10,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=57/500000]
+ train/ActionNoiseL2Loss=0.7966
+ throughput/total_tokens=10,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=58/500000]
+ train/ActionNoiseL2Loss=0.7912
+ throughput/total_tokens=11,136,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=59/500000]
+ train/ActionNoiseL2Loss=0.7167
+ throughput/total_tokens=11,328,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=60/500000]
+ optim/total_grad_norm=16.52
+ train/ActionNoiseL2Loss=0.7780
+ throughput/total_tokens=11,520,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=46,466
+[step=61/500000]
+ train/ActionNoiseL2Loss=0.9503
+ throughput/total_tokens=11,712,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=62/500000]
+ train/ActionNoiseL2Loss=0.7016
+ throughput/total_tokens=11,904,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=63/500000]
+ train/ActionNoiseL2Loss=0.8043
+ throughput/total_tokens=12,096,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=64/500000]
+ train/ActionNoiseL2Loss=0.7205
+ throughput/total_tokens=12,288,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=65/500000]
+ train/ActionNoiseL2Loss=0.7532
+ throughput/total_tokens=12,480,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=66/500000]
+ train/ActionNoiseL2Loss=0.7099
+ throughput/total_tokens=12,672,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=67/500000]
+ train/ActionNoiseL2Loss=0.7720
+ throughput/total_tokens=12,864,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=68/500000]
+ train/ActionNoiseL2Loss=0.7087
+ throughput/total_tokens=13,056,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=69/500000]
+ train/ActionNoiseL2Loss=0.7290
+ throughput/total_tokens=13,248,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=70/500000]
+ train/ActionNoiseL2Loss=0.6438
+ throughput/total_tokens=13,440,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=46,466
+[step=71/500000]
+ train/ActionNoiseL2Loss=0.6892
+ throughput/total_tokens=13,632,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=72/500000]
+ train/ActionNoiseL2Loss=0.6507
+ throughput/total_tokens=13,824,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=73/500000]
+ train/ActionNoiseL2Loss=0.6659
+ throughput/total_tokens=14,016,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=74/500000]
+ train/ActionNoiseL2Loss=0.5843
+ throughput/total_tokens=14,208,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=75/500000]
+ train/ActionNoiseL2Loss=0.6060
+ throughput/total_tokens=14,400,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=76/500000]
+ train/ActionNoiseL2Loss=0.6438
+ throughput/total_tokens=14,592,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=77/500000]
+ train/ActionNoiseL2Loss=0.5932
+ throughput/total_tokens=14,784,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=78/500000]
+ train/ActionNoiseL2Loss=0.5630
+ throughput/total_tokens=14,976,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=79/500000]
+ train/ActionNoiseL2Loss=0.5606
+ throughput/total_tokens=15,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=80/500000]
+ optim/total_grad_norm=11.11
+ train/ActionNoiseL2Loss=0.5712
+ throughput/total_tokens=15,360,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=46,466
+[step=81/500000]
+ train/ActionNoiseL2Loss=0.5985
+ throughput/total_tokens=15,552,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=82/500000]
+ train/ActionNoiseL2Loss=0.5204
+ throughput/total_tokens=15,744,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=83/500000]
+ train/ActionNoiseL2Loss=0.5452
+ throughput/total_tokens=15,936,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=84/500000]
+ train/ActionNoiseL2Loss=0.5178
+ throughput/total_tokens=16,128,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=85/500000]
+ train/ActionNoiseL2Loss=0.7087
+ throughput/total_tokens=16,320,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=86/500000]
+ train/ActionNoiseL2Loss=0.4645
+ throughput/total_tokens=16,512,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=87/500000]
+ train/ActionNoiseL2Loss=0.5340
+ throughput/total_tokens=16,704,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=88/500000]
+ train/ActionNoiseL2Loss=0.5375
+ throughput/total_tokens=16,896,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=89/500000]
+ train/ActionNoiseL2Loss=0.4528
+ throughput/total_tokens=17,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=90/500000]
+ train/ActionNoiseL2Loss=0.4476
+ throughput/total_tokens=17,280,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+ System/Peak GPU Memory (MB)=46,466
+[step=91/500000]
+ train/ActionNoiseL2Loss=0.5516
+ throughput/total_tokens=17,472,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=92/500000]
+ train/ActionNoiseL2Loss=0.4508
+ throughput/total_tokens=17,664,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=93/500000]
+ train/ActionNoiseL2Loss=0.5046
+ throughput/total_tokens=17,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=94/500000]
+ train/ActionNoiseL2Loss=0.5223
+ throughput/total_tokens=18,048,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=95/500000]
+ train/ActionNoiseL2Loss=0.5136
+ throughput/total_tokens=18,240,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=96/500000]
+ train/ActionNoiseL2Loss=0.5097
+ throughput/total_tokens=18,432,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=97/500000]
+ train/ActionNoiseL2Loss=0.4889
+ throughput/total_tokens=18,624,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=98/500000]
+ train/ActionNoiseL2Loss=0.5675
+ throughput/total_tokens=18,816,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0473
+[step=99/500000]
+ train/ActionNoiseL2Loss=0.4163
+ throughput/total_tokens=19,008,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=100/500000]
+ optim/total_grad_norm=9.989
+ train/ActionNoiseL2Loss=0.4979
+ throughput/total_tokens=19,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=101/500000]
+ train/ActionNoiseL2Loss=0.4766
+ throughput/total_tokens=19,392,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=102/500000]
+ train/ActionNoiseL2Loss=0.4478
+ throughput/total_tokens=19,584,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=103/500000]
+ train/ActionNoiseL2Loss=0.4226
+ throughput/total_tokens=19,776,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=104/500000]
+ train/ActionNoiseL2Loss=0.4882
+ throughput/total_tokens=19,968,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=105/500000]
+ train/ActionNoiseL2Loss=0.4806
+ throughput/total_tokens=20,160,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=106/500000]
+ train/ActionNoiseL2Loss=0.3879
+ throughput/total_tokens=20,352,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=107/500000]
+ train/ActionNoiseL2Loss=0.3885
+ throughput/total_tokens=20,544,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=108/500000]
+ train/ActionNoiseL2Loss=0.4721
+ throughput/total_tokens=20,736,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=109/500000]
+ train/ActionNoiseL2Loss=0.4511
+ throughput/total_tokens=20,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=110/500000]
+ train/ActionNoiseL2Loss=0.3504
+ throughput/total_tokens=21,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=46,466
+[step=111/500000]
+ train/ActionNoiseL2Loss=0.3771
+ throughput/total_tokens=21,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=112/500000]
+ train/ActionNoiseL2Loss=0.4994
+ throughput/total_tokens=21,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=113/500000]
+ train/ActionNoiseL2Loss=0.3385
+ throughput/total_tokens=21,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=114/500000]
+ train/ActionNoiseL2Loss=0.4730
+ throughput/total_tokens=21,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=115/500000]
+ train/ActionNoiseL2Loss=0.5198
+ throughput/total_tokens=22,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=116/500000]
+ train/ActionNoiseL2Loss=0.3421
+ throughput/total_tokens=22,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=117/500000]
+ train/ActionNoiseL2Loss=0.3769
+ throughput/total_tokens=22,464,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=118/500000]
+ train/ActionNoiseL2Loss=0.4950
+ throughput/total_tokens=22,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=119/500000]
+ train/ActionNoiseL2Loss=0.3880
+ throughput/total_tokens=22,848,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=120/500000]
+ optim/total_grad_norm=12.74
+ train/ActionNoiseL2Loss=0.4508
+ throughput/total_tokens=23,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=121/500000]
+ train/ActionNoiseL2Loss=0.3989
+ throughput/total_tokens=23,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=122/500000]
+ train/ActionNoiseL2Loss=0.4078
+ throughput/total_tokens=23,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=123/500000]
+ train/ActionNoiseL2Loss=0.4432
+ throughput/total_tokens=23,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=124/500000]
+ train/ActionNoiseL2Loss=0.4540
+ throughput/total_tokens=23,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=125/500000]
+ train/ActionNoiseL2Loss=0.2944
+ throughput/total_tokens=24,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=126/500000]
+ train/ActionNoiseL2Loss=0.4083
+ throughput/total_tokens=24,192,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=127/500000]
+ train/ActionNoiseL2Loss=0.4015
+ throughput/total_tokens=24,384,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=128/500000]
+ train/ActionNoiseL2Loss=0.5455
+ throughput/total_tokens=24,576,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=129/500000]
+ train/ActionNoiseL2Loss=0.4035
+ throughput/total_tokens=24,768,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=130/500000]
+ train/ActionNoiseL2Loss=0.3457
+ throughput/total_tokens=24,960,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=131/500000]
+ train/ActionNoiseL2Loss=0.4458
+ throughput/total_tokens=25,152,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=132/500000]
+ train/ActionNoiseL2Loss=0.3407
+ throughput/total_tokens=25,344,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=133/500000]
+ train/ActionNoiseL2Loss=0.4237
+ throughput/total_tokens=25,536,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=134/500000]
+ train/ActionNoiseL2Loss=0.3580
+ throughput/total_tokens=25,728,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=135/500000]
+ train/ActionNoiseL2Loss=0.4333
+ throughput/total_tokens=25,920,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=136/500000]
+ train/ActionNoiseL2Loss=0.3826
+ throughput/total_tokens=26,112,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=137/500000]
+ train/ActionNoiseL2Loss=0.4427
+ throughput/total_tokens=26,304,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=138/500000]
+ train/ActionNoiseL2Loss=0.4238
+ throughput/total_tokens=26,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=139/500000]
+ train/ActionNoiseL2Loss=0.3519
+ throughput/total_tokens=26,688,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=140/500000]
+ optim/total_grad_norm=25.76
+ train/ActionNoiseL2Loss=0.4200
+ throughput/total_tokens=26,880,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=141/500000]
+ train/ActionNoiseL2Loss=0.3026
+ throughput/total_tokens=27,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=142/500000]
+ train/ActionNoiseL2Loss=0.3159
+ throughput/total_tokens=27,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=143/500000]
+ train/ActionNoiseL2Loss=0.3343
+ throughput/total_tokens=27,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=144/500000]
+ train/ActionNoiseL2Loss=0.3778
+ throughput/total_tokens=27,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=145/500000]
+ train/ActionNoiseL2Loss=0.4359
+ throughput/total_tokens=27,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=146/500000]
+ train/ActionNoiseL2Loss=0.3617
+ throughput/total_tokens=28,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=147/500000]
+ train/ActionNoiseL2Loss=0.3088
+ throughput/total_tokens=28,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=148/500000]
+ train/ActionNoiseL2Loss=0.2733
+ throughput/total_tokens=28,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=149/500000]
+ train/ActionNoiseL2Loss=0.3230
+ throughput/total_tokens=28,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=150/500000]
+ train/ActionNoiseL2Loss=0.3560
+ throughput/total_tokens=28,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=151/500000]
+ train/ActionNoiseL2Loss=0.3144
+ throughput/total_tokens=28,992,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=152/500000]
+ train/ActionNoiseL2Loss=0.4442
+ throughput/total_tokens=29,184,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=153/500000]
+ train/ActionNoiseL2Loss=0.3982
+ throughput/total_tokens=29,376,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=154/500000]
+ train/ActionNoiseL2Loss=0.3358
+ throughput/total_tokens=29,568,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=155/500000]
+ train/ActionNoiseL2Loss=0.4131
+ throughput/total_tokens=29,760,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=156/500000]
+ train/ActionNoiseL2Loss=0.2940
+ throughput/total_tokens=29,952,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=157/500000]
+ train/ActionNoiseL2Loss=0.5577
+ throughput/total_tokens=30,144,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=158/500000]
+ train/ActionNoiseL2Loss=0.2906
+ throughput/total_tokens=30,336,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=159/500000]
+ train/ActionNoiseL2Loss=0.2970
+ throughput/total_tokens=30,528,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=160/500000]
+ optim/total_grad_norm=10.24
+ train/ActionNoiseL2Loss=0.3998
+ throughput/total_tokens=30,720,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=46,466
+[step=161/500000]
+ train/ActionNoiseL2Loss=0.4295
+ throughput/total_tokens=30,912,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=162/500000]
+ train/ActionNoiseL2Loss=0.2536
+ throughput/total_tokens=31,104,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=163/500000]
+ train/ActionNoiseL2Loss=0.3206
+ throughput/total_tokens=31,296,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=164/500000]
+ train/ActionNoiseL2Loss=0.4237
+ throughput/total_tokens=31,488,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=165/500000]
+ train/ActionNoiseL2Loss=0.4070
+ throughput/total_tokens=31,680,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=166/500000]
+ train/ActionNoiseL2Loss=0.3169
+ throughput/total_tokens=31,872,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=167/500000]
+ train/ActionNoiseL2Loss=0.3135
+ throughput/total_tokens=32,064,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=168/500000]
+ train/ActionNoiseL2Loss=0.3783
+ throughput/total_tokens=32,256,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=169/500000]
+ train/ActionNoiseL2Loss=0.3614
+ throughput/total_tokens=32,448,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=170/500000]
+ train/ActionNoiseL2Loss=0.3216
+ throughput/total_tokens=32,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=171/500000]
+ train/ActionNoiseL2Loss=0.3545
+ throughput/total_tokens=32,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=172/500000]
+ train/ActionNoiseL2Loss=0.2900
+ throughput/total_tokens=33,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=173/500000]
+ train/ActionNoiseL2Loss=0.2834
+ throughput/total_tokens=33,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=174/500000]
+ train/ActionNoiseL2Loss=0.3834
+ throughput/total_tokens=33,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=175/500000]
+ train/ActionNoiseL2Loss=0.4440
+ throughput/total_tokens=33,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=176/500000]
+ train/ActionNoiseL2Loss=0.3212
+ throughput/total_tokens=33,792,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=177/500000]
+ train/ActionNoiseL2Loss=0.2958
+ throughput/total_tokens=33,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=178/500000]
+ train/ActionNoiseL2Loss=0.4541
+ throughput/total_tokens=34,176,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=179/500000]
+ train/ActionNoiseL2Loss=0.3694
+ throughput/total_tokens=34,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=180/500000]
+ optim/total_grad_norm=8.388
+ train/ActionNoiseL2Loss=0.2357
+ throughput/total_tokens=34,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=181/500000]
+ train/ActionNoiseL2Loss=0.2931
+ throughput/total_tokens=34,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=182/500000]
+ train/ActionNoiseL2Loss=0.3101
+ throughput/total_tokens=34,944,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=183/500000]
+ train/ActionNoiseL2Loss=0.4172
+ throughput/total_tokens=35,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=184/500000]
+ train/ActionNoiseL2Loss=0.3606
+ throughput/total_tokens=35,328,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=185/500000]
+ train/ActionNoiseL2Loss=0.3948
+ throughput/total_tokens=35,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=186/500000]
+ train/ActionNoiseL2Loss=0.3091
+ throughput/total_tokens=35,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=187/500000]
+ train/ActionNoiseL2Loss=0.2512
+ throughput/total_tokens=35,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=188/500000]
+ train/ActionNoiseL2Loss=0.3056
+ throughput/total_tokens=36,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=189/500000]
+ train/ActionNoiseL2Loss=0.4531
+ throughput/total_tokens=36,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=190/500000]
+ train/ActionNoiseL2Loss=0.2501
+ throughput/total_tokens=36,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=191/500000]
+ train/ActionNoiseL2Loss=0.2584
+ throughput/total_tokens=36,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=192/500000]
+ train/ActionNoiseL2Loss=0.2749
+ throughput/total_tokens=36,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=193/500000]
+ train/ActionNoiseL2Loss=0.2238
+ throughput/total_tokens=37,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=194/500000]
+ train/ActionNoiseL2Loss=0.2902
+ throughput/total_tokens=37,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=195/500000]
+ train/ActionNoiseL2Loss=0.3352
+ throughput/total_tokens=37,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=196/500000]
+ train/ActionNoiseL2Loss=0.2514
+ throughput/total_tokens=37,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=197/500000]
+ train/ActionNoiseL2Loss=0.3044
+ throughput/total_tokens=37,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=198/500000]
+ train/ActionNoiseL2Loss=0.2590
+ throughput/total_tokens=38,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=199/500000]
+ train/ActionNoiseL2Loss=0.2817
+ throughput/total_tokens=38,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=200/500000]
+ optim/total_grad_norm=8.081
+ train/ActionNoiseL2Loss=0.2272
+ throughput/total_tokens=38,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=201/500000]
+ train/ActionNoiseL2Loss=0.2507
+ throughput/total_tokens=38,592,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=202/500000]
+ train/ActionNoiseL2Loss=0.3842
+ throughput/total_tokens=38,784,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=203/500000]
+ train/ActionNoiseL2Loss=0.2665
+ throughput/total_tokens=38,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=204/500000]
+ train/ActionNoiseL2Loss=0.2775
+ throughput/total_tokens=39,168,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=205/500000]
+ train/ActionNoiseL2Loss=0.2497
+ throughput/total_tokens=39,360,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=206/500000]
+ train/ActionNoiseL2Loss=0.2654
+ throughput/total_tokens=39,552,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=207/500000]
+ train/ActionNoiseL2Loss=0.3491
+ throughput/total_tokens=39,744,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=208/500000]
+ train/ActionNoiseL2Loss=0.3331
+ throughput/total_tokens=39,936,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=209/500000]
+ train/ActionNoiseL2Loss=0.2996
+ throughput/total_tokens=40,128,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=210/500000]
+ train/ActionNoiseL2Loss=0.2382
+ throughput/total_tokens=40,320,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=46,466
+[step=211/500000]
+ train/ActionNoiseL2Loss=0.3972
+ throughput/total_tokens=40,512,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=212/500000]
+ train/ActionNoiseL2Loss=0.3004
+ throughput/total_tokens=40,704,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=213/500000]
+ train/ActionNoiseL2Loss=0.2708
+ throughput/total_tokens=40,896,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=214/500000]
+ train/ActionNoiseL2Loss=0.2475
+ throughput/total_tokens=41,088,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=215/500000]
+ train/ActionNoiseL2Loss=0.3061
+ throughput/total_tokens=41,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=216/500000]
+ train/ActionNoiseL2Loss=0.3468
+ throughput/total_tokens=41,472,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=217/500000]
+ train/ActionNoiseL2Loss=0.2352
+ throughput/total_tokens=41,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=218/500000]
+ train/ActionNoiseL2Loss=0.2783
+ throughput/total_tokens=41,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=219/500000]
+ train/ActionNoiseL2Loss=0.2596
+ throughput/total_tokens=42,048,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=220/500000]
+ optim/total_grad_norm=10.34
+ train/ActionNoiseL2Loss=0.3162
+ throughput/total_tokens=42,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=221/500000]
+ train/ActionNoiseL2Loss=0.1944
+ throughput/total_tokens=42,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=222/500000]
+ train/ActionNoiseL2Loss=0.2874
+ throughput/total_tokens=42,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=223/500000]
+ train/ActionNoiseL2Loss=0.1930
+ throughput/total_tokens=42,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=224/500000]
+ train/ActionNoiseL2Loss=0.1822
+ throughput/total_tokens=43,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=225/500000]
+ train/ActionNoiseL2Loss=0.2357
+ throughput/total_tokens=43,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=226/500000]
+ train/ActionNoiseL2Loss=0.3190
+ throughput/total_tokens=43,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=227/500000]
+ train/ActionNoiseL2Loss=0.2700
+ throughput/total_tokens=43,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=228/500000]
+ train/ActionNoiseL2Loss=0.2576
+ throughput/total_tokens=43,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=229/500000]
+ train/ActionNoiseL2Loss=0.3119
+ throughput/total_tokens=43,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=230/500000]
+ train/ActionNoiseL2Loss=0.2470
+ throughput/total_tokens=44,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=231/500000]
+ train/ActionNoiseL2Loss=0.2787
+ throughput/total_tokens=44,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=232/500000]
+ train/ActionNoiseL2Loss=0.2131
+ throughput/total_tokens=44,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=233/500000]
+ train/ActionNoiseL2Loss=0.2140
+ throughput/total_tokens=44,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=234/500000]
+ train/ActionNoiseL2Loss=0.2790
+ throughput/total_tokens=44,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=235/500000]
+ train/ActionNoiseL2Loss=0.2841
+ throughput/total_tokens=45,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=236/500000]
+ train/ActionNoiseL2Loss=0.3142
+ throughput/total_tokens=45,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=237/500000]
+ train/ActionNoiseL2Loss=0.2968
+ throughput/total_tokens=45,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=238/500000]
+ train/ActionNoiseL2Loss=0.2917
+ throughput/total_tokens=45,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=239/500000]
+ train/ActionNoiseL2Loss=0.1781
+ throughput/total_tokens=45,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=240/500000]
+ optim/total_grad_norm=11.27
+ train/ActionNoiseL2Loss=0.2748
+ throughput/total_tokens=46,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=241/500000]
+ train/ActionNoiseL2Loss=0.3014
+ throughput/total_tokens=46,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=242/500000]
+ train/ActionNoiseL2Loss=0.3019
+ throughput/total_tokens=46,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=243/500000]
+ train/ActionNoiseL2Loss=0.2683
+ throughput/total_tokens=46,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=244/500000]
+ train/ActionNoiseL2Loss=0.2722
+ throughput/total_tokens=46,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=245/500000]
+ train/ActionNoiseL2Loss=0.2566
+ throughput/total_tokens=47,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=246/500000]
+ train/ActionNoiseL2Loss=0.2345
+ throughput/total_tokens=47,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=247/500000]
+ train/ActionNoiseL2Loss=0.2830
+ throughput/total_tokens=47,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=248/500000]
+ train/ActionNoiseL2Loss=0.2402
+ throughput/total_tokens=47,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=249/500000]
+ train/ActionNoiseL2Loss=0.3322
+ throughput/total_tokens=47,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=250/500000]
+ train/ActionNoiseL2Loss=0.1921
+ throughput/total_tokens=48,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=251/500000]
+ train/ActionNoiseL2Loss=0.2068
+ throughput/total_tokens=48,192,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=252/500000]
+ train/ActionNoiseL2Loss=0.1653
+ throughput/total_tokens=48,384,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=253/500000]
+ train/ActionNoiseL2Loss=0.2295
+ throughput/total_tokens=48,576,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=254/500000]
+ train/ActionNoiseL2Loss=0.2099
+ throughput/total_tokens=48,768,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=255/500000]
+ train/ActionNoiseL2Loss=0.2011
+ throughput/total_tokens=48,960,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=256/500000]
+ train/ActionNoiseL2Loss=0.3169
+ throughput/total_tokens=49,152,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=257/500000]
+ train/ActionNoiseL2Loss=0.1625
+ throughput/total_tokens=49,344,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=258/500000]
+ train/ActionNoiseL2Loss=0.2130
+ throughput/total_tokens=49,536,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=259/500000]
+ train/ActionNoiseL2Loss=0.3105
+ throughput/total_tokens=49,728,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=260/500000]
+ optim/total_grad_norm=8.103
+ train/ActionNoiseL2Loss=0.2801
+ throughput/total_tokens=49,920,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=46,466
+[step=261/500000]
+ train/ActionNoiseL2Loss=0.2448
+ throughput/total_tokens=50,112,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=262/500000]
+ train/ActionNoiseL2Loss=0.2782
+ throughput/total_tokens=50,304,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=263/500000]
+ train/ActionNoiseL2Loss=0.2392
+ throughput/total_tokens=50,496,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=264/500000]
+ train/ActionNoiseL2Loss=0.2890
+ throughput/total_tokens=50,688,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=265/500000]
+ train/ActionNoiseL2Loss=0.2811
+ throughput/total_tokens=50,880,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=266/500000]
+ train/ActionNoiseL2Loss=0.3359
+ throughput/total_tokens=51,072,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=267/500000]
+ train/ActionNoiseL2Loss=0.2125
+ throughput/total_tokens=51,264,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=268/500000]
+ train/ActionNoiseL2Loss=0.1900
+ throughput/total_tokens=51,456,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=269/500000]
+ train/ActionNoiseL2Loss=0.3595
+ throughput/total_tokens=51,648,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=270/500000]
+ train/ActionNoiseL2Loss=0.2674
+ throughput/total_tokens=51,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=271/500000]
+ train/ActionNoiseL2Loss=0.2773
+ throughput/total_tokens=52,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=272/500000]
+ train/ActionNoiseL2Loss=0.1982
+ throughput/total_tokens=52,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=273/500000]
+ train/ActionNoiseL2Loss=0.3034
+ throughput/total_tokens=52,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=274/500000]
+ train/ActionNoiseL2Loss=0.3005
+ throughput/total_tokens=52,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=275/500000]
+ train/ActionNoiseL2Loss=0.2667
+ throughput/total_tokens=52,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=276/500000]
+ train/ActionNoiseL2Loss=0.2045
+ throughput/total_tokens=52,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=277/500000]
+ train/ActionNoiseL2Loss=0.3129
+ throughput/total_tokens=53,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=278/500000]
+ train/ActionNoiseL2Loss=0.2187
+ throughput/total_tokens=53,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=279/500000]
+ train/ActionNoiseL2Loss=0.2970
+ throughput/total_tokens=53,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=280/500000]
+ optim/total_grad_norm=14.38
+ train/ActionNoiseL2Loss=0.2773
+ throughput/total_tokens=53,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=281/500000]
+ train/ActionNoiseL2Loss=0.2798
+ throughput/total_tokens=53,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=282/500000]
+ train/ActionNoiseL2Loss=0.2945
+ throughput/total_tokens=54,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=283/500000]
+ train/ActionNoiseL2Loss=0.2091
+ throughput/total_tokens=54,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=284/500000]
+ train/ActionNoiseL2Loss=0.2583
+ throughput/total_tokens=54,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=285/500000]
+ train/ActionNoiseL2Loss=0.2045
+ throughput/total_tokens=54,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=286/500000]
+ train/ActionNoiseL2Loss=0.2624
+ throughput/total_tokens=54,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=287/500000]
+ train/ActionNoiseL2Loss=0.2372
+ throughput/total_tokens=55,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=288/500000]
+ train/ActionNoiseL2Loss=0.3396
+ throughput/total_tokens=55,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=289/500000]
+ train/ActionNoiseL2Loss=0.3507
+ throughput/total_tokens=55,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=290/500000]
+ train/ActionNoiseL2Loss=0.2419
+ throughput/total_tokens=55,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=291/500000]
+ train/ActionNoiseL2Loss=0.2690
+ throughput/total_tokens=55,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=292/500000]
+ train/ActionNoiseL2Loss=0.2186
+ throughput/total_tokens=56,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=293/500000]
+ train/ActionNoiseL2Loss=0.2667
+ throughput/total_tokens=56,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=294/500000]
+ train/ActionNoiseL2Loss=0.1711
+ throughput/total_tokens=56,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=295/500000]
+ train/ActionNoiseL2Loss=0.1939
+ throughput/total_tokens=56,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=296/500000]
+ train/ActionNoiseL2Loss=0.1710
+ throughput/total_tokens=56,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=297/500000]
+ train/ActionNoiseL2Loss=0.2816
+ throughput/total_tokens=57,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=298/500000]
+ train/ActionNoiseL2Loss=0.2784
+ throughput/total_tokens=57,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=299/500000]
+ train/ActionNoiseL2Loss=0.1944
+ throughput/total_tokens=57,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=300/500000]
+ optim/total_grad_norm=13.50
+ train/ActionNoiseL2Loss=0.3546
+ throughput/total_tokens=57,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=301/500000]
+ train/ActionNoiseL2Loss=0.1997
+ throughput/total_tokens=57,792,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=302/500000]
+ train/ActionNoiseL2Loss=0.1655
+ throughput/total_tokens=57,984,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=303/500000]
+ train/ActionNoiseL2Loss=0.1311
+ throughput/total_tokens=58,176,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=304/500000]
+ train/ActionNoiseL2Loss=0.2570
+ throughput/total_tokens=58,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=305/500000]
+ train/ActionNoiseL2Loss=0.2502
+ throughput/total_tokens=58,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=306/500000]
+ train/ActionNoiseL2Loss=0.2749
+ throughput/total_tokens=58,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=307/500000]
+ train/ActionNoiseL2Loss=0.2723
+ throughput/total_tokens=58,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=308/500000]
+ train/ActionNoiseL2Loss=0.2322
+ throughput/total_tokens=59,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=309/500000]
+ train/ActionNoiseL2Loss=0.2259
+ throughput/total_tokens=59,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=310/500000]
+ train/ActionNoiseL2Loss=0.3134
+ throughput/total_tokens=59,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=46,466
+[step=311/500000]
+ train/ActionNoiseL2Loss=0.1744
+ throughput/total_tokens=59,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=312/500000]
+ train/ActionNoiseL2Loss=0.2138
+ throughput/total_tokens=59,904,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=313/500000]
+ train/ActionNoiseL2Loss=0.2889
+ throughput/total_tokens=60,096,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=314/500000]
+ train/ActionNoiseL2Loss=0.2621
+ throughput/total_tokens=60,288,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=315/500000]
+ train/ActionNoiseL2Loss=0.1850
+ throughput/total_tokens=60,480,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=316/500000]
+ train/ActionNoiseL2Loss=0.2006
+ throughput/total_tokens=60,672,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=317/500000]
+ train/ActionNoiseL2Loss=0.2321
+ throughput/total_tokens=60,864,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=318/500000]
+ train/ActionNoiseL2Loss=0.2290
+ throughput/total_tokens=61,056,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=319/500000]
+ train/ActionNoiseL2Loss=0.2471
+ throughput/total_tokens=61,248,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=320/500000]
+ optim/total_grad_norm=8.710
+ train/ActionNoiseL2Loss=0.1936
+ throughput/total_tokens=61,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=321/500000]
+ train/ActionNoiseL2Loss=0.2509
+ throughput/total_tokens=61,632,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=322/500000]
+ train/ActionNoiseL2Loss=0.3493
+ throughput/total_tokens=61,824,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=323/500000]
+ train/ActionNoiseL2Loss=0.2690
+ throughput/total_tokens=62,016,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=324/500000]
+ train/ActionNoiseL2Loss=0.2110
+ throughput/total_tokens=62,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=325/500000]
+ train/ActionNoiseL2Loss=0.3516
+ throughput/total_tokens=62,400,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=326/500000]
+ train/ActionNoiseL2Loss=0.2037
+ throughput/total_tokens=62,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=327/500000]
+ train/ActionNoiseL2Loss=0.2345
+ throughput/total_tokens=62,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=328/500000]
+ train/ActionNoiseL2Loss=0.2386
+ throughput/total_tokens=62,976,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=329/500000]
+ train/ActionNoiseL2Loss=0.2019
+ throughput/total_tokens=63,168,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=330/500000]
+ train/ActionNoiseL2Loss=0.3407
+ throughput/total_tokens=63,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=331/500000]
+ train/ActionNoiseL2Loss=0.1779
+ throughput/total_tokens=63,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=332/500000]
+ train/ActionNoiseL2Loss=0.1966
+ throughput/total_tokens=63,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=333/500000]
+ train/ActionNoiseL2Loss=0.1975
+ throughput/total_tokens=63,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=334/500000]
+ train/ActionNoiseL2Loss=0.3297
+ throughput/total_tokens=64,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=335/500000]
+ train/ActionNoiseL2Loss=0.1226
+ throughput/total_tokens=64,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=336/500000]
+ train/ActionNoiseL2Loss=0.1853
+ throughput/total_tokens=64,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=337/500000]
+ train/ActionNoiseL2Loss=0.3215
+ throughput/total_tokens=64,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=338/500000]
+ train/ActionNoiseL2Loss=0.4389
+ throughput/total_tokens=64,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=339/500000]
+ train/ActionNoiseL2Loss=0.2957
+ throughput/total_tokens=65,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=340/500000]
+ optim/total_grad_norm=5.856
+ train/ActionNoiseL2Loss=0.1694
+ throughput/total_tokens=65,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,466
+[step=341/500000]
+ train/ActionNoiseL2Loss=0.2487
+ throughput/total_tokens=65,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=342/500000]
+ train/ActionNoiseL2Loss=0.3343
+ throughput/total_tokens=65,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=343/500000]
+ train/ActionNoiseL2Loss=0.2087
+ throughput/total_tokens=65,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=344/500000]
+ train/ActionNoiseL2Loss=0.1564
+ throughput/total_tokens=66,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=345/500000]
+ train/ActionNoiseL2Loss=0.2816
+ throughput/total_tokens=66,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=346/500000]
+ train/ActionNoiseL2Loss=0.1891
+ throughput/total_tokens=66,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=347/500000]
+ train/ActionNoiseL2Loss=0.1478
+ throughput/total_tokens=66,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=348/500000]
+ train/ActionNoiseL2Loss=0.2085
+ throughput/total_tokens=66,816,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=349/500000]
+ train/ActionNoiseL2Loss=0.3698
+ throughput/total_tokens=67,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=350/500000]
+ train/ActionNoiseL2Loss=0.2137
+ throughput/total_tokens=67,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,466
+[step=351/500000]
+ train/ActionNoiseL2Loss=0.2328
+ throughput/total_tokens=67,392,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=352/500000]
+ train/ActionNoiseL2Loss=0.3303
+ throughput/total_tokens=67,584,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=353/500000]
+ train/ActionNoiseL2Loss=0.2376
+ throughput/total_tokens=67,776,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=354/500000]
+ train/ActionNoiseL2Loss=0.1535
+ throughput/total_tokens=67,968,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=355/500000]
+ train/ActionNoiseL2Loss=0.2089
+ throughput/total_tokens=68,160,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=356/500000]
+ train/ActionNoiseL2Loss=0.2793
+ throughput/total_tokens=68,352,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=357/500000]
+ train/ActionNoiseL2Loss=0.2625
+ throughput/total_tokens=68,544,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=358/500000]
+ train/ActionNoiseL2Loss=0.2617
+ throughput/total_tokens=68,736,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=359/500000]
+ train/ActionNoiseL2Loss=0.1870
+ throughput/total_tokens=68,928,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=360/500000]
+ optim/total_grad_norm=10.34
+ train/ActionNoiseL2Loss=0.1837
+ throughput/total_tokens=69,120,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=361/500000]
+ train/ActionNoiseL2Loss=0.1845
+ throughput/total_tokens=69,312,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=362/500000]
+ train/ActionNoiseL2Loss=0.3257
+ throughput/total_tokens=69,504,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=363/500000]
+ train/ActionNoiseL2Loss=0.2476
+ throughput/total_tokens=69,696,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=364/500000]
+ train/ActionNoiseL2Loss=0.2298
+ throughput/total_tokens=69,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=365/500000]
+ train/ActionNoiseL2Loss=0.3286
+ throughput/total_tokens=70,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=366/500000]
+ train/ActionNoiseL2Loss=0.2485
+ throughput/total_tokens=70,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=367/500000]
+ train/ActionNoiseL2Loss=0.2720
+ throughput/total_tokens=70,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=368/500000]
+ train/ActionNoiseL2Loss=0.3115
+ throughput/total_tokens=70,656,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=369/500000]
+ train/ActionNoiseL2Loss=0.2014
+ throughput/total_tokens=70,848,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=370/500000]
+ train/ActionNoiseL2Loss=0.2187
+ throughput/total_tokens=71,040,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,466
+[step=371/500000]
+ train/ActionNoiseL2Loss=0.2221
+ throughput/total_tokens=71,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=372/500000]
+ train/ActionNoiseL2Loss=0.2432
+ throughput/total_tokens=71,424,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=373/500000]
+ train/ActionNoiseL2Loss=0.2190
+ throughput/total_tokens=71,616,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=374/500000]
+ train/ActionNoiseL2Loss=0.3320
+ throughput/total_tokens=71,808,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=375/500000]
+ train/ActionNoiseL2Loss=0.2550
+ throughput/total_tokens=72,000,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=376/500000]
+ train/ActionNoiseL2Loss=0.2535
+ throughput/total_tokens=72,192,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=377/500000]
+ train/ActionNoiseL2Loss=0.3073
+ throughput/total_tokens=72,384,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=378/500000]
+ train/ActionNoiseL2Loss=0.2906
+ throughput/total_tokens=72,576,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=379/500000]
+ train/ActionNoiseL2Loss=0.2609
+ throughput/total_tokens=72,768,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=380/500000]
+ optim/total_grad_norm=7.854
+ train/ActionNoiseL2Loss=0.2083
+ throughput/total_tokens=72,960,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,466
+[step=381/500000]
+ train/ActionNoiseL2Loss=0.1708
+ throughput/total_tokens=73,152,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=382/500000]
+ train/ActionNoiseL2Loss=0.1741
+ throughput/total_tokens=73,344,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=383/500000]
+ train/ActionNoiseL2Loss=0.3356
+ throughput/total_tokens=73,536,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=384/500000]
+ train/ActionNoiseL2Loss=0.2987
+ throughput/total_tokens=73,728,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=385/500000]
+ train/ActionNoiseL2Loss=0.1961
+ throughput/total_tokens=73,920,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=386/500000]
+ train/ActionNoiseL2Loss=0.2775
+ throughput/total_tokens=74,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=387/500000]
+ train/ActionNoiseL2Loss=0.1825
+ throughput/total_tokens=74,304,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=388/500000]
+ train/ActionNoiseL2Loss=0.2001
+ throughput/total_tokens=74,496,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=389/500000]
+ train/ActionNoiseL2Loss=0.1610
+ throughput/total_tokens=74,688,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=390/500000]
+ train/ActionNoiseL2Loss=0.1510
+ throughput/total_tokens=74,880,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,466
+[step=391/500000]
+ train/ActionNoiseL2Loss=0.3232
+ throughput/total_tokens=75,072,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=392/500000]
+ train/ActionNoiseL2Loss=0.2835
+ throughput/total_tokens=75,264,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=393/500000]
+ train/ActionNoiseL2Loss=0.2579
+ throughput/total_tokens=75,456,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=394/500000]
+ train/ActionNoiseL2Loss=0.2552
+ throughput/total_tokens=75,648,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=395/500000]
+ train/ActionNoiseL2Loss=0.2743
+ throughput/total_tokens=75,840,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=396/500000]
+ train/ActionNoiseL2Loss=0.1744
+ throughput/total_tokens=76,032,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=397/500000]
+ train/ActionNoiseL2Loss=0.2197
+ throughput/total_tokens=76,224,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=398/500000]
+ train/ActionNoiseL2Loss=0.1603
+ throughput/total_tokens=76,416,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=399/500000]
+ train/ActionNoiseL2Loss=0.1804
+ throughput/total_tokens=76,608,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=400/500000]
+ optim/total_grad_norm=7.568
+ train/ActionNoiseL2Loss=0.2300
+ throughput/total_tokens=76,800,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,466
+[step=401/500000]
+ train/ActionNoiseL2Loss=0.1663
+ throughput/total_tokens=76,992,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=402/500000]
+ train/ActionNoiseL2Loss=0.1376
+ throughput/total_tokens=77,184,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=403/500000]
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=77,376,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=404/500000]
+ train/ActionNoiseL2Loss=0.2422
+ throughput/total_tokens=77,568,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=405/500000]
+ train/ActionNoiseL2Loss=0.1551
+ throughput/total_tokens=77,760,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=406/500000]
+ train/ActionNoiseL2Loss=0.1471
+ throughput/total_tokens=77,952,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=407/500000]
+ train/ActionNoiseL2Loss=0.2006
+ throughput/total_tokens=78,144,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=408/500000]
+ train/ActionNoiseL2Loss=0.1625
+ throughput/total_tokens=78,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=409/500000]
+ train/ActionNoiseL2Loss=0.2361
+ throughput/total_tokens=78,528,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=410/500000]
+ train/ActionNoiseL2Loss=0.2913
+ throughput/total_tokens=78,720,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=46,466
+[step=411/500000]
+ train/ActionNoiseL2Loss=0.1979
+ throughput/total_tokens=78,912,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=412/500000]
+ train/ActionNoiseL2Loss=0.2596
+ throughput/total_tokens=79,104,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=413/500000]
+ train/ActionNoiseL2Loss=0.2898
+ throughput/total_tokens=79,296,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=414/500000]
+ train/ActionNoiseL2Loss=0.2442
+ throughput/total_tokens=79,488,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=415/500000]
+ train/ActionNoiseL2Loss=0.2265
+ throughput/total_tokens=79,680,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=416/500000]
+ train/ActionNoiseL2Loss=0.2631
+ throughput/total_tokens=79,872,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=417/500000]
+ train/ActionNoiseL2Loss=0.2071
+ throughput/total_tokens=80,064,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=418/500000]
+ train/ActionNoiseL2Loss=0.2431
+ throughput/total_tokens=80,256,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=419/500000]
+ train/ActionNoiseL2Loss=0.3303
+ throughput/total_tokens=80,448,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=420/500000]
+ optim/total_grad_norm=7.995
+ train/ActionNoiseL2Loss=0.3033
+ throughput/total_tokens=80,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,466
+[step=421/500000]
+ train/ActionNoiseL2Loss=0.2370
+ throughput/total_tokens=80,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=422/500000]
+ train/ActionNoiseL2Loss=0.2063
+ throughput/total_tokens=81,024,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=423/500000]
+ train/ActionNoiseL2Loss=0.2155
+ throughput/total_tokens=81,216,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=424/500000]
+ train/ActionNoiseL2Loss=0.1276
+ throughput/total_tokens=81,408,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=425/500000]
+ train/ActionNoiseL2Loss=0.2112
+ throughput/total_tokens=81,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=426/500000]
+ train/ActionNoiseL2Loss=0.1525
+ throughput/total_tokens=81,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=427/500000]
+ train/ActionNoiseL2Loss=0.1983
+ throughput/total_tokens=81,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=428/500000]
+ train/ActionNoiseL2Loss=0.1931
+ throughput/total_tokens=82,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=429/500000]
+ train/ActionNoiseL2Loss=0.2134
+ throughput/total_tokens=82,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=430/500000]
+ train/ActionNoiseL2Loss=0.1294
+ throughput/total_tokens=82,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,466
+[step=431/500000]
+ train/ActionNoiseL2Loss=0.1944
+ throughput/total_tokens=82,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=432/500000]
+ train/ActionNoiseL2Loss=0.1460
+ throughput/total_tokens=82,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=433/500000]
+ train/ActionNoiseL2Loss=0.1927
+ throughput/total_tokens=83,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=434/500000]
+ train/ActionNoiseL2Loss=0.1641
+ throughput/total_tokens=83,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=435/500000]
+ train/ActionNoiseL2Loss=0.1878
+ throughput/total_tokens=83,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=436/500000]
+ train/ActionNoiseL2Loss=0.2207
+ throughput/total_tokens=83,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=437/500000]
+ train/ActionNoiseL2Loss=0.2696
+ throughput/total_tokens=83,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=438/500000]
+ train/ActionNoiseL2Loss=0.2085
+ throughput/total_tokens=84,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=439/500000]
+ train/ActionNoiseL2Loss=0.1867
+ throughput/total_tokens=84,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=440/500000]
+ optim/total_grad_norm=5.137
+ train/ActionNoiseL2Loss=0.1762
+ throughput/total_tokens=84,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,466
+[step=441/500000]
+ train/ActionNoiseL2Loss=0.1976
+ throughput/total_tokens=84,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=442/500000]
+ train/ActionNoiseL2Loss=0.1882
+ throughput/total_tokens=84,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=443/500000]
+ train/ActionNoiseL2Loss=0.2452
+ throughput/total_tokens=85,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=444/500000]
+ train/ActionNoiseL2Loss=0.2898
+ throughput/total_tokens=85,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=445/500000]
+ train/ActionNoiseL2Loss=0.2574
+ throughput/total_tokens=85,440,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=446/500000]
+ train/ActionNoiseL2Loss=0.1816
+ throughput/total_tokens=85,632,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=447/500000]
+ train/ActionNoiseL2Loss=0.2526
+ throughput/total_tokens=85,824,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=448/500000]
+ train/ActionNoiseL2Loss=0.2209
+ throughput/total_tokens=86,016,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=449/500000]
+ train/ActionNoiseL2Loss=0.2346
+ throughput/total_tokens=86,208,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=450/500000]
+ train/ActionNoiseL2Loss=0.2011
+ throughput/total_tokens=86,400,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,466
+[step=451/500000]
+ train/ActionNoiseL2Loss=0.2793
+ throughput/total_tokens=86,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=452/500000]
+ train/ActionNoiseL2Loss=0.2283
+ throughput/total_tokens=86,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=453/500000]
+ train/ActionNoiseL2Loss=0.3598
+ throughput/total_tokens=86,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=454/500000]
+ train/ActionNoiseL2Loss=0.1979
+ throughput/total_tokens=87,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=455/500000]
+ train/ActionNoiseL2Loss=0.3167
+ throughput/total_tokens=87,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=456/500000]
+ train/ActionNoiseL2Loss=0.2627
+ throughput/total_tokens=87,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=457/500000]
+ train/ActionNoiseL2Loss=0.2170
+ throughput/total_tokens=87,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=458/500000]
+ train/ActionNoiseL2Loss=0.2300
+ throughput/total_tokens=87,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=459/500000]
+ train/ActionNoiseL2Loss=0.1317
+ throughput/total_tokens=88,128,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=460/500000]
+ optim/total_grad_norm=8.390
+ train/ActionNoiseL2Loss=0.2420
+ throughput/total_tokens=88,320,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,466
+[step=461/500000]
+ train/ActionNoiseL2Loss=0.2455
+ throughput/total_tokens=88,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=462/500000]
+ train/ActionNoiseL2Loss=0.2878
+ throughput/total_tokens=88,704,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=463/500000]
+ train/ActionNoiseL2Loss=0.2031
+ throughput/total_tokens=88,896,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=464/500000]
+ train/ActionNoiseL2Loss=0.2064
+ throughput/total_tokens=89,088,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=465/500000]
+ train/ActionNoiseL2Loss=0.1661
+ throughput/total_tokens=89,280,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=466/500000]
+ train/ActionNoiseL2Loss=0.1700
+ throughput/total_tokens=89,472,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=467/500000]
+ train/ActionNoiseL2Loss=0.2314
+ throughput/total_tokens=89,664,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=468/500000]
+ train/ActionNoiseL2Loss=0.2267
+ throughput/total_tokens=89,856,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=469/500000]
+ train/ActionNoiseL2Loss=0.1832
+ throughput/total_tokens=90,048,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=470/500000]
+ train/ActionNoiseL2Loss=0.2069
+ throughput/total_tokens=90,240,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,466
+[step=471/500000]
+ train/ActionNoiseL2Loss=0.1674
+ throughput/total_tokens=90,432,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=472/500000]
+ train/ActionNoiseL2Loss=0.1800
+ throughput/total_tokens=90,624,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=473/500000]
+ train/ActionNoiseL2Loss=0.2219
+ throughput/total_tokens=90,816,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=474/500000]
+ train/ActionNoiseL2Loss=0.1477
+ throughput/total_tokens=91,008,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=475/500000]
+ train/ActionNoiseL2Loss=0.1621
+ throughput/total_tokens=91,200,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=476/500000]
+ train/ActionNoiseL2Loss=0.1578
+ throughput/total_tokens=91,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=477/500000]
+ train/ActionNoiseL2Loss=0.2287
+ throughput/total_tokens=91,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=478/500000]
+ train/ActionNoiseL2Loss=0.1429
+ throughput/total_tokens=91,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=479/500000]
+ train/ActionNoiseL2Loss=0.1813
+ throughput/total_tokens=91,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=480/500000]
+ optim/total_grad_norm=7.148
+ train/ActionNoiseL2Loss=0.1370
+ throughput/total_tokens=92,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,466
+[step=481/500000]
+ train/ActionNoiseL2Loss=0.2582
+ throughput/total_tokens=92,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=482/500000]
+ train/ActionNoiseL2Loss=0.1535
+ throughput/total_tokens=92,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=483/500000]
+ train/ActionNoiseL2Loss=0.2651
+ throughput/total_tokens=92,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=484/500000]
+ train/ActionNoiseL2Loss=0.1196
+ throughput/total_tokens=92,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=485/500000]
+ train/ActionNoiseL2Loss=0.2179
+ throughput/total_tokens=93,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=486/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=93,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=487/500000]
+ train/ActionNoiseL2Loss=0.1586
+ throughput/total_tokens=93,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=488/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=93,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=489/500000]
+ train/ActionNoiseL2Loss=0.2238
+ throughput/total_tokens=93,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=490/500000]
+ train/ActionNoiseL2Loss=0.1695
+ throughput/total_tokens=94,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,466
+[step=491/500000]
+ train/ActionNoiseL2Loss=0.1907
+ throughput/total_tokens=94,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=492/500000]
+ train/ActionNoiseL2Loss=0.1748
+ throughput/total_tokens=94,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=493/500000]
+ train/ActionNoiseL2Loss=0.1775
+ throughput/total_tokens=94,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=494/500000]
+ train/ActionNoiseL2Loss=0.1899
+ throughput/total_tokens=94,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=495/500000]
+ train/ActionNoiseL2Loss=0.2367
+ throughput/total_tokens=95,040,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=496/500000]
+ train/ActionNoiseL2Loss=0.2442
+ throughput/total_tokens=95,232,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=497/500000]
+ train/ActionNoiseL2Loss=0.1562
+ throughput/total_tokens=95,424,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=498/500000]
+ train/ActionNoiseL2Loss=0.2458
+ throughput/total_tokens=95,616,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=499/500000]
+ train/ActionNoiseL2Loss=0.1793
+ throughput/total_tokens=95,808,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=500/500000]
+ optim/total_grad_norm=7.854
+ train/ActionNoiseL2Loss=0.1621
+ throughput/total_tokens=96,000,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,466
+10/02 [19:33:09] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/fully_sharded_data_parallel.py:678: warnings.py:109
+ FutureWarning: FSDP.state_dict_type() and FSDP.set_state_dict_type() are being deprecated. Please use APIs, get_state_dict() and
+ set_state_dict(), which can support different parallelisms, FSDP1, FSDP2, DDP. API doc:
+ https://pytorch.org/docs/stable/distributed.checkpoint.html#torch.distributed.checkpoint.state_dict.get_state_dict .Tutorial:
+ https://pytorch.org/tutorials/recipes/distributed_checkpoint_recipe.html .
+ warnings.warn(
+
+10/02 [19:33:10] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:860: UserWarning: warnings.py:109
+ `_get_pg_default_device` will be deprecated, it only stays for backward-compatiblity reason. If you need to find a device for object
+ collectives, please use `_get_object_coll_device`. If you need to query the device types supported by group, please use
+ `_device_capability(group)`.
+ warnings.warn(
+
+10/02 [19:33:12] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:722: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ local_shape = tensor.shape
+
+ WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:739: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ tensor.shape,
+
+ WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:741: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ tensor.dtype,
+
+10/02 [19:33:16] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/overrides.py:1747: FutureWarning: Please use DTensor warnings.py:109
+ instead and we are deprecating ShardedTensor.
+ result = torch_func_method(public_api, types, args, kwargs)
+
+10/02 [19:33:48] INFO | >> Saving config... checkpoint.py:608
+10/02 [19:34:17] INFO | >> Saving model state... checkpoint.py:796
+10/02 [19:35:29] INFO | >> Saving optim state... checkpoint.py:811
+10/02 [19:37:00] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=501/500000]
+ train/ActionNoiseL2Loss=0.1674
+ throughput/total_tokens=96,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=502/500000]
+ train/ActionNoiseL2Loss=0.1530
+ throughput/total_tokens=96,384,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=503/500000]
+ train/ActionNoiseL2Loss=0.2660
+ throughput/total_tokens=96,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=504/500000]
+ train/ActionNoiseL2Loss=0.3441
+ throughput/total_tokens=96,768,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=505/500000]
+ train/ActionNoiseL2Loss=0.2195
+ throughput/total_tokens=96,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=506/500000]
+ train/ActionNoiseL2Loss=0.2184
+ throughput/total_tokens=97,152,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=507/500000]
+ train/ActionNoiseL2Loss=0.1570
+ throughput/total_tokens=97,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=508/500000]
+ train/ActionNoiseL2Loss=0.1659
+ throughput/total_tokens=97,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=509/500000]
+ train/ActionNoiseL2Loss=0.1862
+ throughput/total_tokens=97,728,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=510/500000]
+ train/ActionNoiseL2Loss=0.2464
+ throughput/total_tokens=97,920,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=511/500000]
+ train/ActionNoiseL2Loss=0.2415
+ throughput/total_tokens=98,112,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=512/500000]
+ train/ActionNoiseL2Loss=0.2539
+ throughput/total_tokens=98,304,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=513/500000]
+ train/ActionNoiseL2Loss=0.1989
+ throughput/total_tokens=98,496,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=514/500000]
+ train/ActionNoiseL2Loss=0.1777
+ throughput/total_tokens=98,688,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=515/500000]
+ train/ActionNoiseL2Loss=0.2258
+ throughput/total_tokens=98,880,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=516/500000]
+ train/ActionNoiseL2Loss=0.1630
+ throughput/total_tokens=99,072,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=517/500000]
+ train/ActionNoiseL2Loss=0.1877
+ throughput/total_tokens=99,264,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=518/500000]
+ train/ActionNoiseL2Loss=0.2142
+ throughput/total_tokens=99,456,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=519/500000]
+ train/ActionNoiseL2Loss=0.3204
+ throughput/total_tokens=99,648,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=520/500000]
+ optim/total_grad_norm=6.090
+ train/ActionNoiseL2Loss=0.1679
+ throughput/total_tokens=99,840,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=521/500000]
+ train/ActionNoiseL2Loss=0.1984
+ throughput/total_tokens=100,032,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=522/500000]
+ train/ActionNoiseL2Loss=0.2036
+ throughput/total_tokens=100,224,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=523/500000]
+ train/ActionNoiseL2Loss=0.1828
+ throughput/total_tokens=100,416,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=524/500000]
+ train/ActionNoiseL2Loss=0.2290
+ throughput/total_tokens=100,608,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=525/500000]
+ train/ActionNoiseL2Loss=0.2821
+ throughput/total_tokens=100,800,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=526/500000]
+ train/ActionNoiseL2Loss=0.2435
+ throughput/total_tokens=100,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=527/500000]
+ train/ActionNoiseL2Loss=0.2739
+ throughput/total_tokens=101,184,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=528/500000]
+ train/ActionNoiseL2Loss=0.1193
+ throughput/total_tokens=101,376,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=529/500000]
+ train/ActionNoiseL2Loss=0.1502
+ throughput/total_tokens=101,568,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=530/500000]
+ train/ActionNoiseL2Loss=0.2882
+ throughput/total_tokens=101,760,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=531/500000]
+ train/ActionNoiseL2Loss=0.1306
+ throughput/total_tokens=101,952,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=532/500000]
+ train/ActionNoiseL2Loss=0.1777
+ throughput/total_tokens=102,144,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=533/500000]
+ train/ActionNoiseL2Loss=0.3513
+ throughput/total_tokens=102,336,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=534/500000]
+ train/ActionNoiseL2Loss=0.2371
+ throughput/total_tokens=102,528,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=535/500000]
+ train/ActionNoiseL2Loss=0.2283
+ throughput/total_tokens=102,720,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=536/500000]
+ train/ActionNoiseL2Loss=0.3120
+ throughput/total_tokens=102,912,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=537/500000]
+ train/ActionNoiseL2Loss=0.2916
+ throughput/total_tokens=103,104,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=538/500000]
+ train/ActionNoiseL2Loss=0.2629
+ throughput/total_tokens=103,296,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=539/500000]
+ train/ActionNoiseL2Loss=0.1655
+ throughput/total_tokens=103,488,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=540/500000]
+ optim/total_grad_norm=5.171
+ train/ActionNoiseL2Loss=0.1467
+ throughput/total_tokens=103,680,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=541/500000]
+ train/ActionNoiseL2Loss=0.1572
+ throughput/total_tokens=103,872,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=542/500000]
+ train/ActionNoiseL2Loss=0.1595
+ throughput/total_tokens=104,064,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=543/500000]
+ train/ActionNoiseL2Loss=0.1667
+ throughput/total_tokens=104,256,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=544/500000]
+ train/ActionNoiseL2Loss=0.1933
+ throughput/total_tokens=104,448,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=545/500000]
+ train/ActionNoiseL2Loss=0.1798
+ throughput/total_tokens=104,640,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=546/500000]
+ train/ActionNoiseL2Loss=0.1458
+ throughput/total_tokens=104,832,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=547/500000]
+ train/ActionNoiseL2Loss=0.1652
+ throughput/total_tokens=105,024,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=548/500000]
+ train/ActionNoiseL2Loss=0.1807
+ throughput/total_tokens=105,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=549/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=105,408,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=550/500000]
+ train/ActionNoiseL2Loss=0.2255
+ throughput/total_tokens=105,600,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=551/500000]
+ train/ActionNoiseL2Loss=0.1599
+ throughput/total_tokens=105,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=552/500000]
+ train/ActionNoiseL2Loss=0.1305
+ throughput/total_tokens=105,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=553/500000]
+ train/ActionNoiseL2Loss=0.1260
+ throughput/total_tokens=106,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=554/500000]
+ train/ActionNoiseL2Loss=0.2247
+ throughput/total_tokens=106,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=555/500000]
+ train/ActionNoiseL2Loss=0.2723
+ throughput/total_tokens=106,560,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=556/500000]
+ train/ActionNoiseL2Loss=0.1615
+ throughput/total_tokens=106,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=557/500000]
+ train/ActionNoiseL2Loss=0.1829
+ throughput/total_tokens=106,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=558/500000]
+ train/ActionNoiseL2Loss=0.2645
+ throughput/total_tokens=107,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=559/500000]
+ train/ActionNoiseL2Loss=0.2718
+ throughput/total_tokens=107,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=560/500000]
+ optim/total_grad_norm=4.806
+ train/ActionNoiseL2Loss=0.1276
+ throughput/total_tokens=107,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=561/500000]
+ train/ActionNoiseL2Loss=0.1883
+ throughput/total_tokens=107,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=562/500000]
+ train/ActionNoiseL2Loss=0.1420
+ throughput/total_tokens=107,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=563/500000]
+ train/ActionNoiseL2Loss=0.2373
+ throughput/total_tokens=108,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=564/500000]
+ train/ActionNoiseL2Loss=0.2068
+ throughput/total_tokens=108,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=565/500000]
+ train/ActionNoiseL2Loss=0.1724
+ throughput/total_tokens=108,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=566/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=108,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=567/500000]
+ train/ActionNoiseL2Loss=0.2793
+ throughput/total_tokens=108,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=568/500000]
+ train/ActionNoiseL2Loss=0.2846
+ throughput/total_tokens=109,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=569/500000]
+ train/ActionNoiseL2Loss=0.1677
+ throughput/total_tokens=109,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=570/500000]
+ train/ActionNoiseL2Loss=0.1959
+ throughput/total_tokens=109,440,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=571/500000]
+ train/ActionNoiseL2Loss=0.2194
+ throughput/total_tokens=109,632,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=572/500000]
+ train/ActionNoiseL2Loss=0.1597
+ throughput/total_tokens=109,824,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=573/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=110,016,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=574/500000]
+ train/ActionNoiseL2Loss=0.1713
+ throughput/total_tokens=110,208,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=575/500000]
+ train/ActionNoiseL2Loss=0.2090
+ throughput/total_tokens=110,400,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=576/500000]
+ train/ActionNoiseL2Loss=0.1672
+ throughput/total_tokens=110,592,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=577/500000]
+ train/ActionNoiseL2Loss=0.1335
+ throughput/total_tokens=110,784,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=578/500000]
+ train/ActionNoiseL2Loss=0.1533
+ throughput/total_tokens=110,976,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=579/500000]
+ train/ActionNoiseL2Loss=0.2659
+ throughput/total_tokens=111,168,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=580/500000]
+ optim/total_grad_norm=6.352
+ train/ActionNoiseL2Loss=0.2190
+ throughput/total_tokens=111,360,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=581/500000]
+ train/ActionNoiseL2Loss=0.3135
+ throughput/total_tokens=111,552,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=582/500000]
+ train/ActionNoiseL2Loss=0.1870
+ throughput/total_tokens=111,744,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=583/500000]
+ train/ActionNoiseL2Loss=0.1836
+ throughput/total_tokens=111,936,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=584/500000]
+ train/ActionNoiseL2Loss=0.1996
+ throughput/total_tokens=112,128,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=585/500000]
+ train/ActionNoiseL2Loss=0.1778
+ throughput/total_tokens=112,320,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=586/500000]
+ train/ActionNoiseL2Loss=0.1848
+ throughput/total_tokens=112,512,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=587/500000]
+ train/ActionNoiseL2Loss=0.1663
+ throughput/total_tokens=112,704,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=588/500000]
+ train/ActionNoiseL2Loss=0.2324
+ throughput/total_tokens=112,896,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=589/500000]
+ train/ActionNoiseL2Loss=0.2922
+ throughput/total_tokens=113,088,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=590/500000]
+ train/ActionNoiseL2Loss=0.2182
+ throughput/total_tokens=113,280,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=591/500000]
+ train/ActionNoiseL2Loss=0.1347
+ throughput/total_tokens=113,472,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=592/500000]
+ train/ActionNoiseL2Loss=0.2171
+ throughput/total_tokens=113,664,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=593/500000]
+ train/ActionNoiseL2Loss=0.2130
+ throughput/total_tokens=113,856,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=594/500000]
+ train/ActionNoiseL2Loss=0.2179
+ throughput/total_tokens=114,048,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=595/500000]
+ train/ActionNoiseL2Loss=0.2466
+ throughput/total_tokens=114,240,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=596/500000]
+ train/ActionNoiseL2Loss=0.2147
+ throughput/total_tokens=114,432,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=597/500000]
+ train/ActionNoiseL2Loss=0.2051
+ throughput/total_tokens=114,624,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=598/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=114,816,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=599/500000]
+ train/ActionNoiseL2Loss=0.2555
+ throughput/total_tokens=115,008,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=600/500000]
+ optim/total_grad_norm=6.384
+ train/ActionNoiseL2Loss=0.1734
+ throughput/total_tokens=115,200,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=601/500000]
+ train/ActionNoiseL2Loss=0.2594
+ throughput/total_tokens=115,392,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=602/500000]
+ train/ActionNoiseL2Loss=0.2443
+ throughput/total_tokens=115,584,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=603/500000]
+ train/ActionNoiseL2Loss=0.1310
+ throughput/total_tokens=115,776,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=604/500000]
+ train/ActionNoiseL2Loss=0.2030
+ throughput/total_tokens=115,968,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=605/500000]
+ train/ActionNoiseL2Loss=0.1531
+ throughput/total_tokens=116,160,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=606/500000]
+ train/ActionNoiseL2Loss=0.1498
+ throughput/total_tokens=116,352,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=607/500000]
+ train/ActionNoiseL2Loss=0.1638
+ throughput/total_tokens=116,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=608/500000]
+ train/ActionNoiseL2Loss=0.1656
+ throughput/total_tokens=116,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=609/500000]
+ train/ActionNoiseL2Loss=0.2403
+ throughput/total_tokens=116,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=610/500000]
+ train/ActionNoiseL2Loss=0.1445
+ throughput/total_tokens=117,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=611/500000]
+ train/ActionNoiseL2Loss=0.1461
+ throughput/total_tokens=117,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=612/500000]
+ train/ActionNoiseL2Loss=0.2374
+ throughput/total_tokens=117,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=613/500000]
+ train/ActionNoiseL2Loss=0.1371
+ throughput/total_tokens=117,696,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=614/500000]
+ train/ActionNoiseL2Loss=0.1547
+ throughput/total_tokens=117,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=615/500000]
+ train/ActionNoiseL2Loss=0.2202
+ throughput/total_tokens=118,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=616/500000]
+ train/ActionNoiseL2Loss=0.2198
+ throughput/total_tokens=118,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=617/500000]
+ train/ActionNoiseL2Loss=0.1380
+ throughput/total_tokens=118,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=618/500000]
+ train/ActionNoiseL2Loss=0.1823
+ throughput/total_tokens=118,656,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=619/500000]
+ train/ActionNoiseL2Loss=0.2708
+ throughput/total_tokens=118,848,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=620/500000]
+ optim/total_grad_norm=5.403
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=119,040,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=621/500000]
+ train/ActionNoiseL2Loss=0.1596
+ throughput/total_tokens=119,232,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=622/500000]
+ train/ActionNoiseL2Loss=0.2501
+ throughput/total_tokens=119,424,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=623/500000]
+ train/ActionNoiseL2Loss=0.1961
+ throughput/total_tokens=119,616,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=624/500000]
+ train/ActionNoiseL2Loss=0.1649
+ throughput/total_tokens=119,808,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=625/500000]
+ train/ActionNoiseL2Loss=0.2027
+ throughput/total_tokens=120,000,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=626/500000]
+ train/ActionNoiseL2Loss=0.1362
+ throughput/total_tokens=120,192,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=627/500000]
+ train/ActionNoiseL2Loss=0.1439
+ throughput/total_tokens=120,384,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=628/500000]
+ train/ActionNoiseL2Loss=0.2690
+ throughput/total_tokens=120,576,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=629/500000]
+ train/ActionNoiseL2Loss=0.2904
+ throughput/total_tokens=120,768,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=630/500000]
+ train/ActionNoiseL2Loss=0.2439
+ throughput/total_tokens=120,960,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=631/500000]
+ train/ActionNoiseL2Loss=0.1738
+ throughput/total_tokens=121,152,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=632/500000]
+ train/ActionNoiseL2Loss=0.2845
+ throughput/total_tokens=121,344,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=633/500000]
+ train/ActionNoiseL2Loss=0.1831
+ throughput/total_tokens=121,536,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=634/500000]
+ train/ActionNoiseL2Loss=0.2294
+ throughput/total_tokens=121,728,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=635/500000]
+ train/ActionNoiseL2Loss=0.1791
+ throughput/total_tokens=121,920,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=636/500000]
+ train/ActionNoiseL2Loss=0.2416
+ throughput/total_tokens=122,112,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=637/500000]
+ train/ActionNoiseL2Loss=0.1801
+ throughput/total_tokens=122,304,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=638/500000]
+ train/ActionNoiseL2Loss=0.2570
+ throughput/total_tokens=122,496,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=639/500000]
+ train/ActionNoiseL2Loss=0.1626
+ throughput/total_tokens=122,688,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=640/500000]
+ optim/total_grad_norm=4.909
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=122,880,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=641/500000]
+ train/ActionNoiseL2Loss=0.2247
+ throughput/total_tokens=123,072,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=642/500000]
+ train/ActionNoiseL2Loss=0.2047
+ throughput/total_tokens=123,264,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=643/500000]
+ train/ActionNoiseL2Loss=0.2031
+ throughput/total_tokens=123,456,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=644/500000]
+ train/ActionNoiseL2Loss=0.2386
+ throughput/total_tokens=123,648,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=645/500000]
+ train/ActionNoiseL2Loss=0.1519
+ throughput/total_tokens=123,840,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=646/500000]
+ train/ActionNoiseL2Loss=0.1892
+ throughput/total_tokens=124,032,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=647/500000]
+ train/ActionNoiseL2Loss=0.1355
+ throughput/total_tokens=124,224,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=648/500000]
+ train/ActionNoiseL2Loss=0.1413
+ throughput/total_tokens=124,416,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=649/500000]
+ train/ActionNoiseL2Loss=0.1748
+ throughput/total_tokens=124,608,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=650/500000]
+ train/ActionNoiseL2Loss=0.1659
+ throughput/total_tokens=124,800,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=651/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=124,992,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=652/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=125,184,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=653/500000]
+ train/ActionNoiseL2Loss=0.1455
+ throughput/total_tokens=125,376,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=654/500000]
+ train/ActionNoiseL2Loss=0.1725
+ throughput/total_tokens=125,568,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=655/500000]
+ train/ActionNoiseL2Loss=0.1326
+ throughput/total_tokens=125,760,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=656/500000]
+ train/ActionNoiseL2Loss=0.1342
+ throughput/total_tokens=125,952,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=657/500000]
+ train/ActionNoiseL2Loss=0.1323
+ throughput/total_tokens=126,144,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=658/500000]
+ train/ActionNoiseL2Loss=0.1596
+ throughput/total_tokens=126,336,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=659/500000]
+ train/ActionNoiseL2Loss=0.1994
+ throughput/total_tokens=126,528,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=660/500000]
+ optim/total_grad_norm=8.607
+ train/ActionNoiseL2Loss=0.2501
+ throughput/total_tokens=126,720,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=661/500000]
+ train/ActionNoiseL2Loss=0.1808
+ throughput/total_tokens=126,912,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=662/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=127,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=663/500000]
+ train/ActionNoiseL2Loss=0.1657
+ throughput/total_tokens=127,296,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=664/500000]
+ train/ActionNoiseL2Loss=0.3033
+ throughput/total_tokens=127,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=665/500000]
+ train/ActionNoiseL2Loss=0.2500
+ throughput/total_tokens=127,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=666/500000]
+ train/ActionNoiseL2Loss=0.1290
+ throughput/total_tokens=127,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=667/500000]
+ train/ActionNoiseL2Loss=0.3252
+ throughput/total_tokens=128,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=668/500000]
+ train/ActionNoiseL2Loss=0.1371
+ throughput/total_tokens=128,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=669/500000]
+ train/ActionNoiseL2Loss=0.1541
+ throughput/total_tokens=128,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=670/500000]
+ train/ActionNoiseL2Loss=0.3200
+ throughput/total_tokens=128,640,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=671/500000]
+ train/ActionNoiseL2Loss=0.1560
+ throughput/total_tokens=128,832,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=672/500000]
+ train/ActionNoiseL2Loss=0.1485
+ throughput/total_tokens=129,024,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=673/500000]
+ train/ActionNoiseL2Loss=0.1790
+ throughput/total_tokens=129,216,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=674/500000]
+ train/ActionNoiseL2Loss=0.1396
+ throughput/total_tokens=129,408,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=675/500000]
+ train/ActionNoiseL2Loss=0.1862
+ throughput/total_tokens=129,600,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=676/500000]
+ train/ActionNoiseL2Loss=0.1710
+ throughput/total_tokens=129,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=677/500000]
+ train/ActionNoiseL2Loss=0.1916
+ throughput/total_tokens=129,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=678/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=130,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=679/500000]
+ train/ActionNoiseL2Loss=0.1434
+ throughput/total_tokens=130,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=680/500000]
+ optim/total_grad_norm=10.83
+ train/ActionNoiseL2Loss=0.3268
+ throughput/total_tokens=130,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=681/500000]
+ train/ActionNoiseL2Loss=0.3122
+ throughput/total_tokens=130,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=682/500000]
+ train/ActionNoiseL2Loss=0.1916
+ throughput/total_tokens=130,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=683/500000]
+ train/ActionNoiseL2Loss=0.1461
+ throughput/total_tokens=131,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=684/500000]
+ train/ActionNoiseL2Loss=0.3319
+ throughput/total_tokens=131,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=685/500000]
+ train/ActionNoiseL2Loss=0.2466
+ throughput/total_tokens=131,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=686/500000]
+ train/ActionNoiseL2Loss=0.1482
+ throughput/total_tokens=131,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=687/500000]
+ train/ActionNoiseL2Loss=0.1311
+ throughput/total_tokens=131,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=688/500000]
+ train/ActionNoiseL2Loss=0.1890
+ throughput/total_tokens=132,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=689/500000]
+ train/ActionNoiseL2Loss=0.1689
+ throughput/total_tokens=132,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=690/500000]
+ train/ActionNoiseL2Loss=0.2583
+ throughput/total_tokens=132,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=691/500000]
+ train/ActionNoiseL2Loss=0.1420
+ throughput/total_tokens=132,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=692/500000]
+ train/ActionNoiseL2Loss=0.2112
+ throughput/total_tokens=132,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=693/500000]
+ train/ActionNoiseL2Loss=0.2673
+ throughput/total_tokens=133,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=694/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=133,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=695/500000]
+ train/ActionNoiseL2Loss=0.1441
+ throughput/total_tokens=133,440,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=696/500000]
+ train/ActionNoiseL2Loss=0.2819
+ throughput/total_tokens=133,632,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=697/500000]
+ train/ActionNoiseL2Loss=0.2091
+ throughput/total_tokens=133,824,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=698/500000]
+ train/ActionNoiseL2Loss=0.1233
+ throughput/total_tokens=134,016,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=699/500000]
+ train/ActionNoiseL2Loss=0.1923
+ throughput/total_tokens=134,208,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=700/500000]
+ optim/total_grad_norm=5.558
+ train/ActionNoiseL2Loss=0.1434
+ throughput/total_tokens=134,400,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=701/500000]
+ train/ActionNoiseL2Loss=0.1514
+ throughput/total_tokens=134,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=702/500000]
+ train/ActionNoiseL2Loss=0.1938
+ throughput/total_tokens=134,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=703/500000]
+ train/ActionNoiseL2Loss=0.1583
+ throughput/total_tokens=134,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=704/500000]
+ train/ActionNoiseL2Loss=0.1340
+ throughput/total_tokens=135,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=705/500000]
+ train/ActionNoiseL2Loss=0.1781
+ throughput/total_tokens=135,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=706/500000]
+ train/ActionNoiseL2Loss=0.1513
+ throughput/total_tokens=135,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=707/500000]
+ train/ActionNoiseL2Loss=0.2424
+ throughput/total_tokens=135,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=708/500000]
+ train/ActionNoiseL2Loss=0.2168
+ throughput/total_tokens=135,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=709/500000]
+ train/ActionNoiseL2Loss=0.1310
+ throughput/total_tokens=136,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=710/500000]
+ train/ActionNoiseL2Loss=0.1958
+ throughput/total_tokens=136,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=711/500000]
+ train/ActionNoiseL2Loss=0.1832
+ throughput/total_tokens=136,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=712/500000]
+ train/ActionNoiseL2Loss=0.1146
+ throughput/total_tokens=136,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=713/500000]
+ train/ActionNoiseL2Loss=0.2449
+ throughput/total_tokens=136,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=714/500000]
+ train/ActionNoiseL2Loss=0.1510
+ throughput/total_tokens=137,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=715/500000]
+ train/ActionNoiseL2Loss=0.1604
+ throughput/total_tokens=137,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=716/500000]
+ train/ActionNoiseL2Loss=0.1514
+ throughput/total_tokens=137,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=717/500000]
+ train/ActionNoiseL2Loss=0.1963
+ throughput/total_tokens=137,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=718/500000]
+ train/ActionNoiseL2Loss=0.2297
+ throughput/total_tokens=137,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=719/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=138,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=720/500000]
+ optim/total_grad_norm=6.196
+ train/ActionNoiseL2Loss=0.1791
+ throughput/total_tokens=138,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=721/500000]
+ train/ActionNoiseL2Loss=0.1620
+ throughput/total_tokens=138,432,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=722/500000]
+ train/ActionNoiseL2Loss=0.1387
+ throughput/total_tokens=138,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=723/500000]
+ train/ActionNoiseL2Loss=0.2290
+ throughput/total_tokens=138,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=724/500000]
+ train/ActionNoiseL2Loss=0.1770
+ throughput/total_tokens=139,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=725/500000]
+ train/ActionNoiseL2Loss=0.1254
+ throughput/total_tokens=139,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=726/500000]
+ train/ActionNoiseL2Loss=0.1834
+ throughput/total_tokens=139,392,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=727/500000]
+ train/ActionNoiseL2Loss=0.1748
+ throughput/total_tokens=139,584,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=728/500000]
+ train/ActionNoiseL2Loss=0.2323
+ throughput/total_tokens=139,776,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=729/500000]
+ train/ActionNoiseL2Loss=0.1802
+ throughput/total_tokens=139,968,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=730/500000]
+ train/ActionNoiseL2Loss=0.1420
+ throughput/total_tokens=140,160,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=731/500000]
+ train/ActionNoiseL2Loss=0.1109
+ throughput/total_tokens=140,352,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=732/500000]
+ train/ActionNoiseL2Loss=0.1344
+ throughput/total_tokens=140,544,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=733/500000]
+ train/ActionNoiseL2Loss=0.1620
+ throughput/total_tokens=140,736,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=734/500000]
+ train/ActionNoiseL2Loss=0.2452
+ throughput/total_tokens=140,928,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=735/500000]
+ train/ActionNoiseL2Loss=0.1041
+ throughput/total_tokens=141,120,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=736/500000]
+ train/ActionNoiseL2Loss=0.1481
+ throughput/total_tokens=141,312,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=737/500000]
+ train/ActionNoiseL2Loss=0.1923
+ throughput/total_tokens=141,504,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=738/500000]
+ train/ActionNoiseL2Loss=0.1782
+ throughput/total_tokens=141,696,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=739/500000]
+ train/ActionNoiseL2Loss=0.2488
+ throughput/total_tokens=141,888,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=740/500000]
+ optim/total_grad_norm=5.064
+ train/ActionNoiseL2Loss=0.1734
+ throughput/total_tokens=142,080,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=741/500000]
+ train/ActionNoiseL2Loss=0.5691
+ throughput/total_tokens=142,272,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=742/500000]
+ train/ActionNoiseL2Loss=0.1579
+ throughput/total_tokens=142,464,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=743/500000]
+ train/ActionNoiseL2Loss=0.1977
+ throughput/total_tokens=142,656,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=744/500000]
+ train/ActionNoiseL2Loss=0.1909
+ throughput/total_tokens=142,848,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=745/500000]
+ train/ActionNoiseL2Loss=0.1115
+ throughput/total_tokens=143,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=746/500000]
+ train/ActionNoiseL2Loss=0.1493
+ throughput/total_tokens=143,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=747/500000]
+ train/ActionNoiseL2Loss=0.2031
+ throughput/total_tokens=143,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=748/500000]
+ train/ActionNoiseL2Loss=0.1186
+ throughput/total_tokens=143,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=749/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=143,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=750/500000]
+ train/ActionNoiseL2Loss=0.1407
+ throughput/total_tokens=144,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=751/500000]
+ train/ActionNoiseL2Loss=0.1666
+ throughput/total_tokens=144,192,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=752/500000]
+ train/ActionNoiseL2Loss=0.1727
+ throughput/total_tokens=144,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=753/500000]
+ train/ActionNoiseL2Loss=0.1812
+ throughput/total_tokens=144,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=754/500000]
+ train/ActionNoiseL2Loss=0.1392
+ throughput/total_tokens=144,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=755/500000]
+ train/ActionNoiseL2Loss=0.1062
+ throughput/total_tokens=144,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=756/500000]
+ train/ActionNoiseL2Loss=0.2009
+ throughput/total_tokens=145,152,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=757/500000]
+ train/ActionNoiseL2Loss=0.1835
+ throughput/total_tokens=145,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=758/500000]
+ train/ActionNoiseL2Loss=0.1692
+ throughput/total_tokens=145,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=759/500000]
+ train/ActionNoiseL2Loss=0.1402
+ throughput/total_tokens=145,728,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=760/500000]
+ optim/total_grad_norm=9.283
+ train/ActionNoiseL2Loss=0.2942
+ throughput/total_tokens=145,920,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=761/500000]
+ train/ActionNoiseL2Loss=0.1318
+ throughput/total_tokens=146,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=762/500000]
+ train/ActionNoiseL2Loss=0.2472
+ throughput/total_tokens=146,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=763/500000]
+ train/ActionNoiseL2Loss=0.1847
+ throughput/total_tokens=146,496,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=764/500000]
+ train/ActionNoiseL2Loss=0.2181
+ throughput/total_tokens=146,688,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=765/500000]
+ train/ActionNoiseL2Loss=0.1618
+ throughput/total_tokens=146,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=766/500000]
+ train/ActionNoiseL2Loss=0.1423
+ throughput/total_tokens=147,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=767/500000]
+ train/ActionNoiseL2Loss=0.1433
+ throughput/total_tokens=147,264,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=768/500000]
+ train/ActionNoiseL2Loss=0.1725
+ throughput/total_tokens=147,456,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=769/500000]
+ train/ActionNoiseL2Loss=0.1285
+ throughput/total_tokens=147,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=770/500000]
+ train/ActionNoiseL2Loss=0.1983
+ throughput/total_tokens=147,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=771/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=148,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=772/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=148,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=773/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=148,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=774/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=148,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=775/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=148,800,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=776/500000]
+ train/ActionNoiseL2Loss=0.2523
+ throughput/total_tokens=148,992,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=777/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=149,184,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=778/500000]
+ train/ActionNoiseL2Loss=0.2039
+ throughput/total_tokens=149,376,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=779/500000]
+ train/ActionNoiseL2Loss=0.2214
+ throughput/total_tokens=149,568,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=780/500000]
+ optim/total_grad_norm=6.529
+ train/ActionNoiseL2Loss=0.2118
+ throughput/total_tokens=149,760,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=781/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=149,952,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=782/500000]
+ train/ActionNoiseL2Loss=0.2339
+ throughput/total_tokens=150,144,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=783/500000]
+ train/ActionNoiseL2Loss=0.2051
+ throughput/total_tokens=150,336,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=784/500000]
+ train/ActionNoiseL2Loss=0.1946
+ throughput/total_tokens=150,528,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=785/500000]
+ train/ActionNoiseL2Loss=0.1098
+ throughput/total_tokens=150,720,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=786/500000]
+ train/ActionNoiseL2Loss=0.1298
+ throughput/total_tokens=150,912,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=787/500000]
+ train/ActionNoiseL2Loss=0.1987
+ throughput/total_tokens=151,104,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=788/500000]
+ train/ActionNoiseL2Loss=0.1574
+ throughput/total_tokens=151,296,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=789/500000]
+ train/ActionNoiseL2Loss=0.1720
+ throughput/total_tokens=151,488,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=790/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=151,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=791/500000]
+ train/ActionNoiseL2Loss=0.2105
+ throughput/total_tokens=151,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=792/500000]
+ train/ActionNoiseL2Loss=0.1400
+ throughput/total_tokens=152,064,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=793/500000]
+ train/ActionNoiseL2Loss=0.1365
+ throughput/total_tokens=152,256,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=794/500000]
+ train/ActionNoiseL2Loss=0.2196
+ throughput/total_tokens=152,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=795/500000]
+ train/ActionNoiseL2Loss=0.1518
+ throughput/total_tokens=152,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=796/500000]
+ train/ActionNoiseL2Loss=0.2115
+ throughput/total_tokens=152,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=797/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=153,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=798/500000]
+ train/ActionNoiseL2Loss=0.1296
+ throughput/total_tokens=153,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=799/500000]
+ train/ActionNoiseL2Loss=0.1658
+ throughput/total_tokens=153,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=800/500000]
+ optim/total_grad_norm=4.071
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=153,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=801/500000]
+ train/ActionNoiseL2Loss=0.1136
+ throughput/total_tokens=153,792,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=802/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=153,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=803/500000]
+ train/ActionNoiseL2Loss=0.2097
+ throughput/total_tokens=154,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=804/500000]
+ train/ActionNoiseL2Loss=0.1360
+ throughput/total_tokens=154,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=805/500000]
+ train/ActionNoiseL2Loss=0.1668
+ throughput/total_tokens=154,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=806/500000]
+ train/ActionNoiseL2Loss=0.1626
+ throughput/total_tokens=154,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=807/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=154,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=808/500000]
+ train/ActionNoiseL2Loss=0.1511
+ throughput/total_tokens=155,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=809/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=155,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=810/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=155,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=811/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=155,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=812/500000]
+ train/ActionNoiseL2Loss=0.2101
+ throughput/total_tokens=155,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=813/500000]
+ train/ActionNoiseL2Loss=0.1459
+ throughput/total_tokens=156,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=814/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=156,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=815/500000]
+ train/ActionNoiseL2Loss=0.1374
+ throughput/total_tokens=156,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=816/500000]
+ train/ActionNoiseL2Loss=0.2086
+ throughput/total_tokens=156,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=817/500000]
+ train/ActionNoiseL2Loss=0.1712
+ throughput/total_tokens=156,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=818/500000]
+ train/ActionNoiseL2Loss=0.1546
+ throughput/total_tokens=157,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=819/500000]
+ train/ActionNoiseL2Loss=0.1607
+ throughput/total_tokens=157,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=820/500000]
+ optim/total_grad_norm=6.825
+ train/ActionNoiseL2Loss=0.1392
+ throughput/total_tokens=157,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=821/500000]
+ train/ActionNoiseL2Loss=0.1680
+ throughput/total_tokens=157,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=822/500000]
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=157,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=823/500000]
+ train/ActionNoiseL2Loss=0.1863
+ throughput/total_tokens=158,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=824/500000]
+ train/ActionNoiseL2Loss=0.1519
+ throughput/total_tokens=158,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=825/500000]
+ train/ActionNoiseL2Loss=0.1831
+ throughput/total_tokens=158,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=826/500000]
+ train/ActionNoiseL2Loss=0.2353
+ throughput/total_tokens=158,592,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=827/500000]
+ train/ActionNoiseL2Loss=0.2001
+ throughput/total_tokens=158,784,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=828/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=158,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=829/500000]
+ train/ActionNoiseL2Loss=0.1307
+ throughput/total_tokens=159,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=830/500000]
+ train/ActionNoiseL2Loss=0.1298
+ throughput/total_tokens=159,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=831/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=159,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=832/500000]
+ train/ActionNoiseL2Loss=0.1717
+ throughput/total_tokens=159,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=833/500000]
+ train/ActionNoiseL2Loss=0.1867
+ throughput/total_tokens=159,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=834/500000]
+ train/ActionNoiseL2Loss=0.1557
+ throughput/total_tokens=160,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=835/500000]
+ train/ActionNoiseL2Loss=0.1417
+ throughput/total_tokens=160,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=836/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=160,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=837/500000]
+ train/ActionNoiseL2Loss=0.1287
+ throughput/total_tokens=160,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=838/500000]
+ train/ActionNoiseL2Loss=0.1131
+ throughput/total_tokens=160,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=839/500000]
+ train/ActionNoiseL2Loss=0.1887
+ throughput/total_tokens=161,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=840/500000]
+ optim/total_grad_norm=4.136
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=161,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=841/500000]
+ train/ActionNoiseL2Loss=0.2147
+ throughput/total_tokens=161,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=842/500000]
+ train/ActionNoiseL2Loss=0.1349
+ throughput/total_tokens=161,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=843/500000]
+ train/ActionNoiseL2Loss=0.1647
+ throughput/total_tokens=161,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=844/500000]
+ train/ActionNoiseL2Loss=0.1500
+ throughput/total_tokens=162,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=845/500000]
+ train/ActionNoiseL2Loss=0.1722
+ throughput/total_tokens=162,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=846/500000]
+ train/ActionNoiseL2Loss=0.1354
+ throughput/total_tokens=162,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=847/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=162,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=848/500000]
+ train/ActionNoiseL2Loss=0.1573
+ throughput/total_tokens=162,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=849/500000]
+ train/ActionNoiseL2Loss=0.2257
+ throughput/total_tokens=163,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=850/500000]
+ train/ActionNoiseL2Loss=0.1154
+ throughput/total_tokens=163,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=851/500000]
+ train/ActionNoiseL2Loss=0.1345
+ throughput/total_tokens=163,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=852/500000]
+ train/ActionNoiseL2Loss=0.1670
+ throughput/total_tokens=163,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=853/500000]
+ train/ActionNoiseL2Loss=0.1247
+ throughput/total_tokens=163,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=854/500000]
+ train/ActionNoiseL2Loss=0.1699
+ throughput/total_tokens=163,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=855/500000]
+ train/ActionNoiseL2Loss=0.2748
+ throughput/total_tokens=164,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=856/500000]
+ train/ActionNoiseL2Loss=0.1834
+ throughput/total_tokens=164,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=857/500000]
+ train/ActionNoiseL2Loss=0.1150
+ throughput/total_tokens=164,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=858/500000]
+ train/ActionNoiseL2Loss=0.1688
+ throughput/total_tokens=164,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=859/500000]
+ train/ActionNoiseL2Loss=0.3518
+ throughput/total_tokens=164,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=860/500000]
+ optim/total_grad_norm=8.800
+ train/ActionNoiseL2Loss=0.1977
+ throughput/total_tokens=165,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=861/500000]
+ train/ActionNoiseL2Loss=0.2296
+ throughput/total_tokens=165,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=862/500000]
+ train/ActionNoiseL2Loss=0.2021
+ throughput/total_tokens=165,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=863/500000]
+ train/ActionNoiseL2Loss=0.2903
+ throughput/total_tokens=165,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=864/500000]
+ train/ActionNoiseL2Loss=0.3246
+ throughput/total_tokens=165,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=865/500000]
+ train/ActionNoiseL2Loss=0.1344
+ throughput/total_tokens=166,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=866/500000]
+ train/ActionNoiseL2Loss=0.3162
+ throughput/total_tokens=166,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=867/500000]
+ train/ActionNoiseL2Loss=0.1836
+ throughput/total_tokens=166,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=868/500000]
+ train/ActionNoiseL2Loss=0.1695
+ throughput/total_tokens=166,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=869/500000]
+ train/ActionNoiseL2Loss=0.1289
+ throughput/total_tokens=166,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=870/500000]
+ train/ActionNoiseL2Loss=0.1637
+ throughput/total_tokens=167,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=871/500000]
+ train/ActionNoiseL2Loss=0.1568
+ throughput/total_tokens=167,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=872/500000]
+ train/ActionNoiseL2Loss=0.2287
+ throughput/total_tokens=167,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=873/500000]
+ train/ActionNoiseL2Loss=0.1176
+ throughput/total_tokens=167,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=874/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=167,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=875/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=168,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=876/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=168,192,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=877/500000]
+ train/ActionNoiseL2Loss=0.1941
+ throughput/total_tokens=168,384,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=878/500000]
+ train/ActionNoiseL2Loss=0.1818
+ throughput/total_tokens=168,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=879/500000]
+ train/ActionNoiseL2Loss=0.1682
+ throughput/total_tokens=168,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=880/500000]
+ optim/total_grad_norm=4.237
+ train/ActionNoiseL2Loss=0.1299
+ throughput/total_tokens=168,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=881/500000]
+ train/ActionNoiseL2Loss=0.1186
+ throughput/total_tokens=169,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=882/500000]
+ train/ActionNoiseL2Loss=0.1478
+ throughput/total_tokens=169,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=883/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=169,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=884/500000]
+ train/ActionNoiseL2Loss=0.1148
+ throughput/total_tokens=169,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=885/500000]
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=169,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=886/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=170,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=887/500000]
+ train/ActionNoiseL2Loss=0.1510
+ throughput/total_tokens=170,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=888/500000]
+ train/ActionNoiseL2Loss=0.2276
+ throughput/total_tokens=170,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=889/500000]
+ train/ActionNoiseL2Loss=0.1288
+ throughput/total_tokens=170,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=890/500000]
+ train/ActionNoiseL2Loss=0.1956
+ throughput/total_tokens=170,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=891/500000]
+ train/ActionNoiseL2Loss=0.1616
+ throughput/total_tokens=171,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=892/500000]
+ train/ActionNoiseL2Loss=0.1378
+ throughput/total_tokens=171,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=893/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=171,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=894/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=171,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=895/500000]
+ train/ActionNoiseL2Loss=0.1698
+ throughput/total_tokens=171,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=896/500000]
+ train/ActionNoiseL2Loss=0.1804
+ throughput/total_tokens=172,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=897/500000]
+ train/ActionNoiseL2Loss=0.1816
+ throughput/total_tokens=172,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=898/500000]
+ train/ActionNoiseL2Loss=0.1109
+ throughput/total_tokens=172,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=899/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=172,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=900/500000]
+ optim/total_grad_norm=3.651
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=172,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=901/500000]
+ train/ActionNoiseL2Loss=0.1501
+ throughput/total_tokens=172,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=902/500000]
+ train/ActionNoiseL2Loss=0.2208
+ throughput/total_tokens=173,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=903/500000]
+ train/ActionNoiseL2Loss=0.1723
+ throughput/total_tokens=173,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=904/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=173,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=905/500000]
+ train/ActionNoiseL2Loss=0.1259
+ throughput/total_tokens=173,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=906/500000]
+ train/ActionNoiseL2Loss=0.1312
+ throughput/total_tokens=173,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=907/500000]
+ train/ActionNoiseL2Loss=0.1595
+ throughput/total_tokens=174,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=908/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=174,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=909/500000]
+ train/ActionNoiseL2Loss=0.1550
+ throughput/total_tokens=174,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=910/500000]
+ train/ActionNoiseL2Loss=0.1218
+ throughput/total_tokens=174,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=911/500000]
+ train/ActionNoiseL2Loss=0.1312
+ throughput/total_tokens=174,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=912/500000]
+ train/ActionNoiseL2Loss=0.1527
+ throughput/total_tokens=175,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=913/500000]
+ train/ActionNoiseL2Loss=0.1149
+ throughput/total_tokens=175,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=914/500000]
+ train/ActionNoiseL2Loss=0.1541
+ throughput/total_tokens=175,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=915/500000]
+ train/ActionNoiseL2Loss=0.1766
+ throughput/total_tokens=175,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=916/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=175,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=917/500000]
+ train/ActionNoiseL2Loss=0.1456
+ throughput/total_tokens=176,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=918/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=176,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=919/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=176,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=920/500000]
+ optim/total_grad_norm=5.819
+ train/ActionNoiseL2Loss=0.1375
+ throughput/total_tokens=176,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=921/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=176,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=922/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=177,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=923/500000]
+ train/ActionNoiseL2Loss=0.1437
+ throughput/total_tokens=177,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=924/500000]
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=177,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=925/500000]
+ train/ActionNoiseL2Loss=0.1250
+ throughput/total_tokens=177,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=926/500000]
+ train/ActionNoiseL2Loss=0.1278
+ throughput/total_tokens=177,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=927/500000]
+ train/ActionNoiseL2Loss=0.1513
+ throughput/total_tokens=177,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=928/500000]
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=178,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=929/500000]
+ train/ActionNoiseL2Loss=0.1650
+ throughput/total_tokens=178,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=930/500000]
+ train/ActionNoiseL2Loss=0.1514
+ throughput/total_tokens=178,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=931/500000]
+ train/ActionNoiseL2Loss=0.2923
+ throughput/total_tokens=178,752,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=932/500000]
+ train/ActionNoiseL2Loss=0.1248
+ throughput/total_tokens=178,944,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=933/500000]
+ train/ActionNoiseL2Loss=0.2503
+ throughput/total_tokens=179,136,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=934/500000]
+ train/ActionNoiseL2Loss=0.1612
+ throughput/total_tokens=179,328,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=935/500000]
+ train/ActionNoiseL2Loss=0.1340
+ throughput/total_tokens=179,520,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=936/500000]
+ train/ActionNoiseL2Loss=0.1532
+ throughput/total_tokens=179,712,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=937/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=179,904,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=938/500000]
+ train/ActionNoiseL2Loss=0.1407
+ throughput/total_tokens=180,096,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=939/500000]
+ train/ActionNoiseL2Loss=0.1414
+ throughput/total_tokens=180,288,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=940/500000]
+ optim/total_grad_norm=5.268
+ train/ActionNoiseL2Loss=0.1775
+ throughput/total_tokens=180,480,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=941/500000]
+ train/ActionNoiseL2Loss=0.1418
+ throughput/total_tokens=180,672,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=942/500000]
+ train/ActionNoiseL2Loss=0.3448
+ throughput/total_tokens=180,864,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=943/500000]
+ train/ActionNoiseL2Loss=0.1829
+ throughput/total_tokens=181,056,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=944/500000]
+ train/ActionNoiseL2Loss=0.1327
+ throughput/total_tokens=181,248,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=945/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=181,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=946/500000]
+ train/ActionNoiseL2Loss=0.2025
+ throughput/total_tokens=181,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=947/500000]
+ train/ActionNoiseL2Loss=0.1341
+ throughput/total_tokens=181,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=948/500000]
+ train/ActionNoiseL2Loss=0.2028
+ throughput/total_tokens=182,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=949/500000]
+ train/ActionNoiseL2Loss=0.1469
+ throughput/total_tokens=182,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=950/500000]
+ train/ActionNoiseL2Loss=0.1953
+ throughput/total_tokens=182,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=951/500000]
+ train/ActionNoiseL2Loss=0.1565
+ throughput/total_tokens=182,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=952/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=182,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=953/500000]
+ train/ActionNoiseL2Loss=0.1150
+ throughput/total_tokens=182,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=954/500000]
+ train/ActionNoiseL2Loss=0.2855
+ throughput/total_tokens=183,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=955/500000]
+ train/ActionNoiseL2Loss=0.1136
+ throughput/total_tokens=183,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=956/500000]
+ train/ActionNoiseL2Loss=0.2340
+ throughput/total_tokens=183,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=957/500000]
+ train/ActionNoiseL2Loss=0.1837
+ throughput/total_tokens=183,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=958/500000]
+ train/ActionNoiseL2Loss=0.1979
+ throughput/total_tokens=183,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=959/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=184,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=960/500000]
+ optim/total_grad_norm=5.818
+ train/ActionNoiseL2Loss=0.1388
+ throughput/total_tokens=184,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=961/500000]
+ train/ActionNoiseL2Loss=0.1531
+ throughput/total_tokens=184,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=962/500000]
+ train/ActionNoiseL2Loss=0.1416
+ throughput/total_tokens=184,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=963/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=184,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=964/500000]
+ train/ActionNoiseL2Loss=0.1260
+ throughput/total_tokens=185,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=965/500000]
+ train/ActionNoiseL2Loss=0.1457
+ throughput/total_tokens=185,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=966/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=185,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=967/500000]
+ train/ActionNoiseL2Loss=0.1945
+ throughput/total_tokens=185,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=968/500000]
+ train/ActionNoiseL2Loss=0.1710
+ throughput/total_tokens=185,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=969/500000]
+ train/ActionNoiseL2Loss=0.1914
+ throughput/total_tokens=186,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=970/500000]
+ train/ActionNoiseL2Loss=0.2915
+ throughput/total_tokens=186,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=971/500000]
+ train/ActionNoiseL2Loss=0.1539
+ throughput/total_tokens=186,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=972/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=186,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=973/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=186,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=974/500000]
+ train/ActionNoiseL2Loss=0.2049
+ throughput/total_tokens=187,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=975/500000]
+ train/ActionNoiseL2Loss=0.1798
+ throughput/total_tokens=187,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=976/500000]
+ train/ActionNoiseL2Loss=0.2216
+ throughput/total_tokens=187,392,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=977/500000]
+ train/ActionNoiseL2Loss=0.1452
+ throughput/total_tokens=187,584,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=978/500000]
+ train/ActionNoiseL2Loss=0.2503
+ throughput/total_tokens=187,776,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=979/500000]
+ train/ActionNoiseL2Loss=0.1029
+ throughput/total_tokens=187,968,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=980/500000]
+ optim/total_grad_norm=5.260
+ train/ActionNoiseL2Loss=0.1422
+ throughput/total_tokens=188,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=981/500000]
+ train/ActionNoiseL2Loss=0.2035
+ throughput/total_tokens=188,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=982/500000]
+ train/ActionNoiseL2Loss=0.1529
+ throughput/total_tokens=188,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=983/500000]
+ train/ActionNoiseL2Loss=0.1710
+ throughput/total_tokens=188,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=984/500000]
+ train/ActionNoiseL2Loss=0.1172
+ throughput/total_tokens=188,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=985/500000]
+ train/ActionNoiseL2Loss=0.1253
+ throughput/total_tokens=189,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=986/500000]
+ train/ActionNoiseL2Loss=0.1430
+ throughput/total_tokens=189,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=987/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=189,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=988/500000]
+ train/ActionNoiseL2Loss=0.1527
+ throughput/total_tokens=189,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=989/500000]
+ train/ActionNoiseL2Loss=0.1423
+ throughput/total_tokens=189,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=990/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=190,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=991/500000]
+ train/ActionNoiseL2Loss=0.1636
+ throughput/total_tokens=190,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=992/500000]
+ train/ActionNoiseL2Loss=0.1347
+ throughput/total_tokens=190,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=993/500000]
+ train/ActionNoiseL2Loss=0.2059
+ throughput/total_tokens=190,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=994/500000]
+ train/ActionNoiseL2Loss=0.2097
+ throughput/total_tokens=190,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=995/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=191,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=996/500000]
+ train/ActionNoiseL2Loss=0.2354
+ throughput/total_tokens=191,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=997/500000]
+ train/ActionNoiseL2Loss=0.1353
+ throughput/total_tokens=191,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=998/500000]
+ train/ActionNoiseL2Loss=0.1670
+ throughput/total_tokens=191,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=999/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=191,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1000/500000]
+ optim/total_grad_norm=5.061
+ train/ActionNoiseL2Loss=0.1718
+ throughput/total_tokens=192,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+10/02 [22:31:35] INFO | >> Saving config... checkpoint.py:608
+10/02 [22:32:15] INFO | >> Saving model state... checkpoint.py:796
+10/02 [22:33:26] INFO | >> Saving optim state... checkpoint.py:811
+10/02 [22:34:56] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=1001/500000]
+ train/ActionNoiseL2Loss=0.2947
+ throughput/total_tokens=192,192,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=1002/500000]
+ train/ActionNoiseL2Loss=0.1600
+ throughput/total_tokens=192,384,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=1003/500000]
+ train/ActionNoiseL2Loss=0.1261
+ throughput/total_tokens=192,576,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1004/500000]
+ train/ActionNoiseL2Loss=0.1515
+ throughput/total_tokens=192,768,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1005/500000]
+ train/ActionNoiseL2Loss=0.1224
+ throughput/total_tokens=192,960,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1006/500000]
+ train/ActionNoiseL2Loss=0.2017
+ throughput/total_tokens=193,152,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1007/500000]
+ train/ActionNoiseL2Loss=0.1203
+ throughput/total_tokens=193,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1008/500000]
+ train/ActionNoiseL2Loss=0.1844
+ throughput/total_tokens=193,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1009/500000]
+ train/ActionNoiseL2Loss=0.1546
+ throughput/total_tokens=193,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1010/500000]
+ train/ActionNoiseL2Loss=0.1344
+ throughput/total_tokens=193,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1011/500000]
+ train/ActionNoiseL2Loss=0.1291
+ throughput/total_tokens=194,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1012/500000]
+ train/ActionNoiseL2Loss=0.1693
+ throughput/total_tokens=194,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1013/500000]
+ train/ActionNoiseL2Loss=0.1407
+ throughput/total_tokens=194,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1014/500000]
+ train/ActionNoiseL2Loss=0.1511
+ throughput/total_tokens=194,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1015/500000]
+ train/ActionNoiseL2Loss=0.1621
+ throughput/total_tokens=194,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1016/500000]
+ train/ActionNoiseL2Loss=0.1637
+ throughput/total_tokens=195,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1017/500000]
+ train/ActionNoiseL2Loss=0.1772
+ throughput/total_tokens=195,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1018/500000]
+ train/ActionNoiseL2Loss=0.1381
+ throughput/total_tokens=195,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1019/500000]
+ train/ActionNoiseL2Loss=0.1494
+ throughput/total_tokens=195,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1020/500000]
+ optim/total_grad_norm=4.445
+ train/ActionNoiseL2Loss=0.1331
+ throughput/total_tokens=195,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1021/500000]
+ train/ActionNoiseL2Loss=0.1177
+ throughput/total_tokens=196,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1022/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=196,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1023/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=196,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1024/500000]
+ train/ActionNoiseL2Loss=0.1246
+ throughput/total_tokens=196,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1025/500000]
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=196,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1026/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=196,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1027/500000]
+ train/ActionNoiseL2Loss=0.0959
+ throughput/total_tokens=197,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1028/500000]
+ train/ActionNoiseL2Loss=0.1655
+ throughput/total_tokens=197,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1029/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=197,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1030/500000]
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=197,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1031/500000]
+ train/ActionNoiseL2Loss=0.1140
+ throughput/total_tokens=197,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1032/500000]
+ train/ActionNoiseL2Loss=0.1370
+ throughput/total_tokens=198,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1033/500000]
+ train/ActionNoiseL2Loss=0.1320
+ throughput/total_tokens=198,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1034/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=198,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1035/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=198,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1036/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=198,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1037/500000]
+ train/ActionNoiseL2Loss=0.1412
+ throughput/total_tokens=199,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1038/500000]
+ train/ActionNoiseL2Loss=0.1301
+ throughput/total_tokens=199,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1039/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=199,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1040/500000]
+ optim/total_grad_norm=7.956
+ train/ActionNoiseL2Loss=0.1763
+ throughput/total_tokens=199,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1041/500000]
+ train/ActionNoiseL2Loss=0.1552
+ throughput/total_tokens=199,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1042/500000]
+ train/ActionNoiseL2Loss=0.1202
+ throughput/total_tokens=200,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1043/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=200,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1044/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=200,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1045/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=200,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1046/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=200,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1047/500000]
+ train/ActionNoiseL2Loss=0.1978
+ throughput/total_tokens=201,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1048/500000]
+ train/ActionNoiseL2Loss=0.1467
+ throughput/total_tokens=201,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1049/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=201,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1050/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=201,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1051/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=201,792,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1052/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=201,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1053/500000]
+ train/ActionNoiseL2Loss=0.1012
+ throughput/total_tokens=202,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1054/500000]
+ train/ActionNoiseL2Loss=0.1489
+ throughput/total_tokens=202,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1055/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=202,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1056/500000]
+ train/ActionNoiseL2Loss=0.1816
+ throughput/total_tokens=202,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1057/500000]
+ train/ActionNoiseL2Loss=0.1303
+ throughput/total_tokens=202,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1058/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=203,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1059/500000]
+ train/ActionNoiseL2Loss=0.1963
+ throughput/total_tokens=203,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1060/500000]
+ optim/total_grad_norm=5.899
+ train/ActionNoiseL2Loss=0.1713
+ throughput/total_tokens=203,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=1061/500000]
+ train/ActionNoiseL2Loss=0.1722
+ throughput/total_tokens=203,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1062/500000]
+ train/ActionNoiseL2Loss=0.2153
+ throughput/total_tokens=203,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1063/500000]
+ train/ActionNoiseL2Loss=0.1416
+ throughput/total_tokens=204,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1064/500000]
+ train/ActionNoiseL2Loss=0.1247
+ throughput/total_tokens=204,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1065/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=204,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1066/500000]
+ train/ActionNoiseL2Loss=0.1262
+ throughput/total_tokens=204,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1067/500000]
+ train/ActionNoiseL2Loss=0.2411
+ throughput/total_tokens=204,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1068/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=205,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1069/500000]
+ train/ActionNoiseL2Loss=0.2505
+ throughput/total_tokens=205,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1070/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=205,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1071/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=205,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1072/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=205,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1073/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=206,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1074/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=206,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1075/500000]
+ train/ActionNoiseL2Loss=0.1609
+ throughput/total_tokens=206,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1076/500000]
+ train/ActionNoiseL2Loss=0.1364
+ throughput/total_tokens=206,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1077/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=206,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1078/500000]
+ train/ActionNoiseL2Loss=0.1205
+ throughput/total_tokens=206,976,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1079/500000]
+ train/ActionNoiseL2Loss=0.1056
+ throughput/total_tokens=207,168,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1080/500000]
+ optim/total_grad_norm=5.487
+ train/ActionNoiseL2Loss=0.1831
+ throughput/total_tokens=207,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1081/500000]
+ train/ActionNoiseL2Loss=0.1385
+ throughput/total_tokens=207,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1082/500000]
+ train/ActionNoiseL2Loss=0.1532
+ throughput/total_tokens=207,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1083/500000]
+ train/ActionNoiseL2Loss=0.1776
+ throughput/total_tokens=207,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1084/500000]
+ train/ActionNoiseL2Loss=0.1476
+ throughput/total_tokens=208,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1085/500000]
+ train/ActionNoiseL2Loss=0.1189
+ throughput/total_tokens=208,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1086/500000]
+ train/ActionNoiseL2Loss=0.1478
+ throughput/total_tokens=208,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1087/500000]
+ train/ActionNoiseL2Loss=0.1338
+ throughput/total_tokens=208,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1088/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=208,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1089/500000]
+ train/ActionNoiseL2Loss=0.1516
+ throughput/total_tokens=209,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1090/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=209,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1091/500000]
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=209,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1092/500000]
+ train/ActionNoiseL2Loss=0.1153
+ throughput/total_tokens=209,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1093/500000]
+ train/ActionNoiseL2Loss=0.1475
+ throughput/total_tokens=209,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1094/500000]
+ train/ActionNoiseL2Loss=0.2118
+ throughput/total_tokens=210,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1095/500000]
+ train/ActionNoiseL2Loss=0.1665
+ throughput/total_tokens=210,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1096/500000]
+ train/ActionNoiseL2Loss=0.1162
+ throughput/total_tokens=210,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1097/500000]
+ train/ActionNoiseL2Loss=0.1584
+ throughput/total_tokens=210,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1098/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=210,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1099/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=211,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1100/500000]
+ optim/total_grad_norm=3.531
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=211,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1101/500000]
+ train/ActionNoiseL2Loss=0.1947
+ throughput/total_tokens=211,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1102/500000]
+ train/ActionNoiseL2Loss=0.1029
+ throughput/total_tokens=211,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1103/500000]
+ train/ActionNoiseL2Loss=0.1841
+ throughput/total_tokens=211,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1104/500000]
+ train/ActionNoiseL2Loss=0.1190
+ throughput/total_tokens=211,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1105/500000]
+ train/ActionNoiseL2Loss=0.1563
+ throughput/total_tokens=212,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1106/500000]
+ train/ActionNoiseL2Loss=0.3729
+ throughput/total_tokens=212,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1107/500000]
+ train/ActionNoiseL2Loss=0.1484
+ throughput/total_tokens=212,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1108/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=212,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1109/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=212,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1110/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=213,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=1111/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=213,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1112/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=213,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1113/500000]
+ train/ActionNoiseL2Loss=0.1184
+ throughput/total_tokens=213,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1114/500000]
+ train/ActionNoiseL2Loss=0.1438
+ throughput/total_tokens=213,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1115/500000]
+ train/ActionNoiseL2Loss=0.1654
+ throughput/total_tokens=214,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1116/500000]
+ train/ActionNoiseL2Loss=0.2396
+ throughput/total_tokens=214,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1117/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=214,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1118/500000]
+ train/ActionNoiseL2Loss=0.1235
+ throughput/total_tokens=214,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1119/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=214,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1120/500000]
+ optim/total_grad_norm=4.674
+ train/ActionNoiseL2Loss=0.1245
+ throughput/total_tokens=215,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1121/500000]
+ train/ActionNoiseL2Loss=0.1360
+ throughput/total_tokens=215,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1122/500000]
+ train/ActionNoiseL2Loss=0.1422
+ throughput/total_tokens=215,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1123/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=215,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1124/500000]
+ train/ActionNoiseL2Loss=0.2469
+ throughput/total_tokens=215,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1125/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=216,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1126/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=216,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1127/500000]
+ train/ActionNoiseL2Loss=0.1159
+ throughput/total_tokens=216,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1128/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=216,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1129/500000]
+ train/ActionNoiseL2Loss=0.1038
+ throughput/total_tokens=216,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1130/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=216,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1131/500000]
+ train/ActionNoiseL2Loss=0.2018
+ throughput/total_tokens=217,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1132/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=217,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1133/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=217,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1134/500000]
+ train/ActionNoiseL2Loss=0.1529
+ throughput/total_tokens=217,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1135/500000]
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=217,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1136/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=218,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1137/500000]
+ train/ActionNoiseL2Loss=0.1280
+ throughput/total_tokens=218,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1138/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=218,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1139/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=218,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1140/500000]
+ optim/total_grad_norm=8.092
+ train/ActionNoiseL2Loss=0.2361
+ throughput/total_tokens=218,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1141/500000]
+ train/ActionNoiseL2Loss=0.3073
+ throughput/total_tokens=219,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1142/500000]
+ train/ActionNoiseL2Loss=0.1252
+ throughput/total_tokens=219,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1143/500000]
+ train/ActionNoiseL2Loss=0.1527
+ throughput/total_tokens=219,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1144/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=219,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1145/500000]
+ train/ActionNoiseL2Loss=0.2561
+ throughput/total_tokens=219,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1146/500000]
+ train/ActionNoiseL2Loss=0.2207
+ throughput/total_tokens=220,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1147/500000]
+ train/ActionNoiseL2Loss=0.2180
+ throughput/total_tokens=220,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1148/500000]
+ train/ActionNoiseL2Loss=0.2462
+ throughput/total_tokens=220,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1149/500000]
+ train/ActionNoiseL2Loss=0.2231
+ throughput/total_tokens=220,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1150/500000]
+ train/ActionNoiseL2Loss=0.1308
+ throughput/total_tokens=220,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1151/500000]
+ train/ActionNoiseL2Loss=0.1118
+ throughput/total_tokens=220,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1152/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=221,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1153/500000]
+ train/ActionNoiseL2Loss=0.1984
+ throughput/total_tokens=221,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1154/500000]
+ train/ActionNoiseL2Loss=0.1230
+ throughput/total_tokens=221,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1155/500000]
+ train/ActionNoiseL2Loss=0.2136
+ throughput/total_tokens=221,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1156/500000]
+ train/ActionNoiseL2Loss=0.2237
+ throughput/total_tokens=221,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1157/500000]
+ train/ActionNoiseL2Loss=0.1885
+ throughput/total_tokens=222,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1158/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=222,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1159/500000]
+ train/ActionNoiseL2Loss=0.1401
+ throughput/total_tokens=222,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1160/500000]
+ optim/total_grad_norm=3.534
+ train/ActionNoiseL2Loss=0.1115
+ throughput/total_tokens=222,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=1161/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=222,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1162/500000]
+ train/ActionNoiseL2Loss=0.1768
+ throughput/total_tokens=223,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1163/500000]
+ train/ActionNoiseL2Loss=0.1740
+ throughput/total_tokens=223,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1164/500000]
+ train/ActionNoiseL2Loss=0.1198
+ throughput/total_tokens=223,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1165/500000]
+ train/ActionNoiseL2Loss=0.1320
+ throughput/total_tokens=223,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1166/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=223,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1167/500000]
+ train/ActionNoiseL2Loss=0.1963
+ throughput/total_tokens=224,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1168/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=224,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1169/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=224,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1170/500000]
+ train/ActionNoiseL2Loss=0.1092
+ throughput/total_tokens=224,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1171/500000]
+ train/ActionNoiseL2Loss=0.4028
+ throughput/total_tokens=224,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1172/500000]
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=225,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1173/500000]
+ train/ActionNoiseL2Loss=0.1604
+ throughput/total_tokens=225,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1174/500000]
+ train/ActionNoiseL2Loss=0.1860
+ throughput/total_tokens=225,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1175/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=225,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1176/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=225,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1177/500000]
+ train/ActionNoiseL2Loss=0.1273
+ throughput/total_tokens=225,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1178/500000]
+ train/ActionNoiseL2Loss=0.1563
+ throughput/total_tokens=226,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1179/500000]
+ train/ActionNoiseL2Loss=0.1843
+ throughput/total_tokens=226,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1180/500000]
+ optim/total_grad_norm=5.323
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=226,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1181/500000]
+ train/ActionNoiseL2Loss=0.1366
+ throughput/total_tokens=226,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1182/500000]
+ train/ActionNoiseL2Loss=0.1331
+ throughput/total_tokens=226,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1183/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=227,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1184/500000]
+ train/ActionNoiseL2Loss=0.1437
+ throughput/total_tokens=227,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1185/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=227,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1186/500000]
+ train/ActionNoiseL2Loss=0.2253
+ throughput/total_tokens=227,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1187/500000]
+ train/ActionNoiseL2Loss=0.1457
+ throughput/total_tokens=227,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1188/500000]
+ train/ActionNoiseL2Loss=0.2355
+ throughput/total_tokens=228,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1189/500000]
+ train/ActionNoiseL2Loss=0.1650
+ throughput/total_tokens=228,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1190/500000]
+ train/ActionNoiseL2Loss=0.1341
+ throughput/total_tokens=228,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1191/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=228,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1192/500000]
+ train/ActionNoiseL2Loss=0.1245
+ throughput/total_tokens=228,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1193/500000]
+ train/ActionNoiseL2Loss=0.1116
+ throughput/total_tokens=229,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1194/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=229,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1195/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=229,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1196/500000]
+ train/ActionNoiseL2Loss=0.1457
+ throughput/total_tokens=229,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1197/500000]
+ train/ActionNoiseL2Loss=0.1472
+ throughput/total_tokens=229,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1198/500000]
+ train/ActionNoiseL2Loss=0.1616
+ throughput/total_tokens=230,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1199/500000]
+ train/ActionNoiseL2Loss=0.1545
+ throughput/total_tokens=230,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1200/500000]
+ optim/total_grad_norm=5.239
+ train/ActionNoiseL2Loss=0.1611
+ throughput/total_tokens=230,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1201/500000]
+ train/ActionNoiseL2Loss=0.1449
+ throughput/total_tokens=230,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1202/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=230,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1203/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=230,976,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1204/500000]
+ train/ActionNoiseL2Loss=0.1331
+ throughput/total_tokens=231,168,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1205/500000]
+ train/ActionNoiseL2Loss=0.1174
+ throughput/total_tokens=231,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1206/500000]
+ train/ActionNoiseL2Loss=0.1740
+ throughput/total_tokens=231,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1207/500000]
+ train/ActionNoiseL2Loss=0.1149
+ throughput/total_tokens=231,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1208/500000]
+ train/ActionNoiseL2Loss=0.1177
+ throughput/total_tokens=231,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1209/500000]
+ train/ActionNoiseL2Loss=0.1538
+ throughput/total_tokens=232,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1210/500000]
+ train/ActionNoiseL2Loss=0.1237
+ throughput/total_tokens=232,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=1211/500000]
+ train/ActionNoiseL2Loss=0.2270
+ throughput/total_tokens=232,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1212/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=232,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1213/500000]
+ train/ActionNoiseL2Loss=0.2131
+ throughput/total_tokens=232,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1214/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=233,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1215/500000]
+ train/ActionNoiseL2Loss=0.1879
+ throughput/total_tokens=233,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1216/500000]
+ train/ActionNoiseL2Loss=0.2432
+ throughput/total_tokens=233,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1217/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=233,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1218/500000]
+ train/ActionNoiseL2Loss=0.1579
+ throughput/total_tokens=233,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1219/500000]
+ train/ActionNoiseL2Loss=0.1160
+ throughput/total_tokens=234,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1220/500000]
+ optim/total_grad_norm=3.107
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=234,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1221/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=234,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1222/500000]
+ train/ActionNoiseL2Loss=0.2064
+ throughput/total_tokens=234,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1223/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=234,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1224/500000]
+ train/ActionNoiseL2Loss=0.1150
+ throughput/total_tokens=235,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1225/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=235,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1226/500000]
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=235,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1227/500000]
+ train/ActionNoiseL2Loss=0.1794
+ throughput/total_tokens=235,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1228/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=235,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1229/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=235,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1230/500000]
+ train/ActionNoiseL2Loss=0.1201
+ throughput/total_tokens=236,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1231/500000]
+ train/ActionNoiseL2Loss=0.1450
+ throughput/total_tokens=236,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1232/500000]
+ train/ActionNoiseL2Loss=0.1887
+ throughput/total_tokens=236,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1233/500000]
+ train/ActionNoiseL2Loss=0.1368
+ throughput/total_tokens=236,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1234/500000]
+ train/ActionNoiseL2Loss=0.2180
+ throughput/total_tokens=236,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1235/500000]
+ train/ActionNoiseL2Loss=0.1611
+ throughput/total_tokens=237,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1236/500000]
+ train/ActionNoiseL2Loss=0.1850
+ throughput/total_tokens=237,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1237/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=237,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1238/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=237,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1239/500000]
+ train/ActionNoiseL2Loss=0.1373
+ throughput/total_tokens=237,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1240/500000]
+ optim/total_grad_norm=5.065
+ train/ActionNoiseL2Loss=0.1199
+ throughput/total_tokens=238,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1241/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=238,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1242/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=238,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1243/500000]
+ train/ActionNoiseL2Loss=0.1736
+ throughput/total_tokens=238,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1244/500000]
+ train/ActionNoiseL2Loss=0.1782
+ throughput/total_tokens=238,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1245/500000]
+ train/ActionNoiseL2Loss=0.1608
+ throughput/total_tokens=239,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1246/500000]
+ train/ActionNoiseL2Loss=0.1410
+ throughput/total_tokens=239,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1247/500000]
+ train/ActionNoiseL2Loss=0.1368
+ throughput/total_tokens=239,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1248/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=239,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1249/500000]
+ train/ActionNoiseL2Loss=0.1154
+ throughput/total_tokens=239,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1250/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=240,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1251/500000]
+ train/ActionNoiseL2Loss=0.1272
+ throughput/total_tokens=240,192,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1252/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=240,384,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1253/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=240,576,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1254/500000]
+ train/ActionNoiseL2Loss=0.1102
+ throughput/total_tokens=240,768,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1255/500000]
+ train/ActionNoiseL2Loss=0.1201
+ throughput/total_tokens=240,960,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1256/500000]
+ train/ActionNoiseL2Loss=0.1232
+ throughput/total_tokens=241,152,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1257/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=241,344,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1258/500000]
+ train/ActionNoiseL2Loss=0.1680
+ throughput/total_tokens=241,536,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1259/500000]
+ train/ActionNoiseL2Loss=0.1269
+ throughput/total_tokens=241,728,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1260/500000]
+ optim/total_grad_norm=5.918
+ train/ActionNoiseL2Loss=0.1319
+ throughput/total_tokens=241,920,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=1261/500000]
+ train/ActionNoiseL2Loss=0.1378
+ throughput/total_tokens=242,112,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1262/500000]
+ train/ActionNoiseL2Loss=0.1897
+ throughput/total_tokens=242,304,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1263/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=242,496,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1264/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=242,688,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1265/500000]
+ train/ActionNoiseL2Loss=0.1419
+ throughput/total_tokens=242,880,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1266/500000]
+ train/ActionNoiseL2Loss=0.1264
+ throughput/total_tokens=243,072,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1267/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=243,264,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1268/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=243,456,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1269/500000]
+ train/ActionNoiseL2Loss=0.1347
+ throughput/total_tokens=243,648,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1270/500000]
+ train/ActionNoiseL2Loss=0.1828
+ throughput/total_tokens=243,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1271/500000]
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=244,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1272/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=244,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1273/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=244,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1274/500000]
+ train/ActionNoiseL2Loss=0.1919
+ throughput/total_tokens=244,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1275/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=244,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1276/500000]
+ train/ActionNoiseL2Loss=0.1662
+ throughput/total_tokens=244,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1277/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=245,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1278/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=245,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1279/500000]
+ train/ActionNoiseL2Loss=0.1598
+ throughput/total_tokens=245,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1280/500000]
+ optim/total_grad_norm=3.625
+ train/ActionNoiseL2Loss=0.1468
+ throughput/total_tokens=245,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1281/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=245,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1282/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=246,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1283/500000]
+ train/ActionNoiseL2Loss=0.1652
+ throughput/total_tokens=246,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1284/500000]
+ train/ActionNoiseL2Loss=0.1354
+ throughput/total_tokens=246,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1285/500000]
+ train/ActionNoiseL2Loss=0.1533
+ throughput/total_tokens=246,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1286/500000]
+ train/ActionNoiseL2Loss=0.2070
+ throughput/total_tokens=246,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1287/500000]
+ train/ActionNoiseL2Loss=0.1230
+ throughput/total_tokens=247,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1288/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=247,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1289/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=247,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1290/500000]
+ train/ActionNoiseL2Loss=0.1442
+ throughput/total_tokens=247,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1291/500000]
+ train/ActionNoiseL2Loss=0.1963
+ throughput/total_tokens=247,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1292/500000]
+ train/ActionNoiseL2Loss=0.1426
+ throughput/total_tokens=248,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1293/500000]
+ train/ActionNoiseL2Loss=0.2401
+ throughput/total_tokens=248,256,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1294/500000]
+ train/ActionNoiseL2Loss=0.1019
+ throughput/total_tokens=248,448,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1295/500000]
+ train/ActionNoiseL2Loss=0.1274
+ throughput/total_tokens=248,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1296/500000]
+ train/ActionNoiseL2Loss=0.1856
+ throughput/total_tokens=248,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1297/500000]
+ train/ActionNoiseL2Loss=0.1380
+ throughput/total_tokens=249,024,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1298/500000]
+ train/ActionNoiseL2Loss=0.2050
+ throughput/total_tokens=249,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1299/500000]
+ train/ActionNoiseL2Loss=0.1307
+ throughput/total_tokens=249,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1300/500000]
+ optim/total_grad_norm=3.249
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=249,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1301/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=249,792,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1302/500000]
+ train/ActionNoiseL2Loss=0.1225
+ throughput/total_tokens=249,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1303/500000]
+ train/ActionNoiseL2Loss=0.1598
+ throughput/total_tokens=250,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1304/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=250,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1305/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=250,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1306/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=250,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1307/500000]
+ train/ActionNoiseL2Loss=0.1215
+ throughput/total_tokens=250,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1308/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=251,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1309/500000]
+ train/ActionNoiseL2Loss=0.1177
+ throughput/total_tokens=251,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1310/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=251,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=1311/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=251,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1312/500000]
+ train/ActionNoiseL2Loss=0.1346
+ throughput/total_tokens=251,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1313/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=252,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1314/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=252,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1315/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=252,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1316/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=252,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1317/500000]
+ train/ActionNoiseL2Loss=0.1261
+ throughput/total_tokens=252,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1318/500000]
+ train/ActionNoiseL2Loss=0.2180
+ throughput/total_tokens=253,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1319/500000]
+ train/ActionNoiseL2Loss=0.1561
+ throughput/total_tokens=253,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1320/500000]
+ optim/total_grad_norm=3.827
+ train/ActionNoiseL2Loss=0.1486
+ throughput/total_tokens=253,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1321/500000]
+ train/ActionNoiseL2Loss=0.1905
+ throughput/total_tokens=253,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1322/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=253,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1323/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=254,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1324/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=254,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1325/500000]
+ train/ActionNoiseL2Loss=0.1644
+ throughput/total_tokens=254,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1326/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=254,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1327/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=254,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1328/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=254,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1329/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=255,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1330/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=255,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1331/500000]
+ train/ActionNoiseL2Loss=0.1542
+ throughput/total_tokens=255,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1332/500000]
+ train/ActionNoiseL2Loss=0.1499
+ throughput/total_tokens=255,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1333/500000]
+ train/ActionNoiseL2Loss=0.1299
+ throughput/total_tokens=255,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1334/500000]
+ train/ActionNoiseL2Loss=0.1459
+ throughput/total_tokens=256,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1335/500000]
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=256,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1336/500000]
+ train/ActionNoiseL2Loss=0.1175
+ throughput/total_tokens=256,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1337/500000]
+ train/ActionNoiseL2Loss=0.1189
+ throughput/total_tokens=256,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1338/500000]
+ train/ActionNoiseL2Loss=0.1250
+ throughput/total_tokens=256,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1339/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=257,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1340/500000]
+ optim/total_grad_norm=2.816
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=257,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1341/500000]
+ train/ActionNoiseL2Loss=0.1086
+ throughput/total_tokens=257,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1342/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=257,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1343/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=257,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1344/500000]
+ train/ActionNoiseL2Loss=0.1381
+ throughput/total_tokens=258,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1345/500000]
+ train/ActionNoiseL2Loss=0.1645
+ throughput/total_tokens=258,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1346/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=258,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1347/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=258,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1348/500000]
+ train/ActionNoiseL2Loss=0.2401
+ throughput/total_tokens=258,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1349/500000]
+ train/ActionNoiseL2Loss=0.1609
+ throughput/total_tokens=259,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1350/500000]
+ train/ActionNoiseL2Loss=0.2275
+ throughput/total_tokens=259,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1351/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=259,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1352/500000]
+ train/ActionNoiseL2Loss=0.1260
+ throughput/total_tokens=259,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1353/500000]
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=259,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1354/500000]
+ train/ActionNoiseL2Loss=0.2056
+ throughput/total_tokens=259,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1355/500000]
+ train/ActionNoiseL2Loss=0.2698
+ throughput/total_tokens=260,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1356/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=260,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1357/500000]
+ train/ActionNoiseL2Loss=0.1484
+ throughput/total_tokens=260,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1358/500000]
+ train/ActionNoiseL2Loss=0.1896
+ throughput/total_tokens=260,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1359/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=260,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1360/500000]
+ optim/total_grad_norm=3.854
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=261,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=1361/500000]
+ train/ActionNoiseL2Loss=0.1038
+ throughput/total_tokens=261,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1362/500000]
+ train/ActionNoiseL2Loss=0.2279
+ throughput/total_tokens=261,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1363/500000]
+ train/ActionNoiseL2Loss=0.1175
+ throughput/total_tokens=261,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1364/500000]
+ train/ActionNoiseL2Loss=0.1249
+ throughput/total_tokens=261,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1365/500000]
+ train/ActionNoiseL2Loss=0.1145
+ throughput/total_tokens=262,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1366/500000]
+ train/ActionNoiseL2Loss=0.1618
+ throughput/total_tokens=262,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1367/500000]
+ train/ActionNoiseL2Loss=0.1773
+ throughput/total_tokens=262,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1368/500000]
+ train/ActionNoiseL2Loss=0.1428
+ throughput/total_tokens=262,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1369/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=262,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1370/500000]
+ train/ActionNoiseL2Loss=0.2686
+ throughput/total_tokens=263,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1371/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=263,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1372/500000]
+ train/ActionNoiseL2Loss=0.2113
+ throughput/total_tokens=263,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1373/500000]
+ train/ActionNoiseL2Loss=0.1872
+ throughput/total_tokens=263,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1374/500000]
+ train/ActionNoiseL2Loss=0.1867
+ throughput/total_tokens=263,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1375/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=264,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1376/500000]
+ train/ActionNoiseL2Loss=0.1301
+ throughput/total_tokens=264,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1377/500000]
+ train/ActionNoiseL2Loss=0.1109
+ throughput/total_tokens=264,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1378/500000]
+ train/ActionNoiseL2Loss=0.1487
+ throughput/total_tokens=264,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1379/500000]
+ train/ActionNoiseL2Loss=0.1434
+ throughput/total_tokens=264,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1380/500000]
+ optim/total_grad_norm=4.485
+ train/ActionNoiseL2Loss=0.1115
+ throughput/total_tokens=264,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1381/500000]
+ train/ActionNoiseL2Loss=0.1602
+ throughput/total_tokens=265,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1382/500000]
+ train/ActionNoiseL2Loss=0.2571
+ throughput/total_tokens=265,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1383/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=265,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1384/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=265,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1385/500000]
+ train/ActionNoiseL2Loss=0.1652
+ throughput/total_tokens=265,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1386/500000]
+ train/ActionNoiseL2Loss=0.1230
+ throughput/total_tokens=266,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1387/500000]
+ train/ActionNoiseL2Loss=0.1445
+ throughput/total_tokens=266,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1388/500000]
+ train/ActionNoiseL2Loss=0.2146
+ throughput/total_tokens=266,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1389/500000]
+ train/ActionNoiseL2Loss=0.1571
+ throughput/total_tokens=266,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1390/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=266,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1391/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=267,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1392/500000]
+ train/ActionNoiseL2Loss=0.1054
+ throughput/total_tokens=267,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1393/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=267,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1394/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=267,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1395/500000]
+ train/ActionNoiseL2Loss=0.1251
+ throughput/total_tokens=267,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1396/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=268,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1397/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=268,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1398/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=268,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1399/500000]
+ train/ActionNoiseL2Loss=0.1523
+ throughput/total_tokens=268,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1400/500000]
+ optim/total_grad_norm=2.819
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=268,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1401/500000]
+ train/ActionNoiseL2Loss=0.1236
+ throughput/total_tokens=268,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1402/500000]
+ train/ActionNoiseL2Loss=0.1295
+ throughput/total_tokens=269,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1403/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=269,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1404/500000]
+ train/ActionNoiseL2Loss=0.1561
+ throughput/total_tokens=269,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1405/500000]
+ train/ActionNoiseL2Loss=0.1814
+ throughput/total_tokens=269,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1406/500000]
+ train/ActionNoiseL2Loss=0.1236
+ throughput/total_tokens=269,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1407/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=270,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1408/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=270,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1409/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=270,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1410/500000]
+ train/ActionNoiseL2Loss=0.2167
+ throughput/total_tokens=270,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=1411/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=270,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1412/500000]
+ train/ActionNoiseL2Loss=0.1088
+ throughput/total_tokens=271,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1413/500000]
+ train/ActionNoiseL2Loss=0.2339
+ throughput/total_tokens=271,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1414/500000]
+ train/ActionNoiseL2Loss=0.1186
+ throughput/total_tokens=271,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1415/500000]
+ train/ActionNoiseL2Loss=0.1012
+ throughput/total_tokens=271,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1416/500000]
+ train/ActionNoiseL2Loss=0.1552
+ throughput/total_tokens=271,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1417/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=272,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1418/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=272,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1419/500000]
+ train/ActionNoiseL2Loss=0.1720
+ throughput/total_tokens=272,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1420/500000]
+ optim/total_grad_norm=4.916
+ train/ActionNoiseL2Loss=0.1288
+ throughput/total_tokens=272,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1421/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=272,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1422/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=273,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1423/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=273,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1424/500000]
+ train/ActionNoiseL2Loss=0.2039
+ throughput/total_tokens=273,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1425/500000]
+ train/ActionNoiseL2Loss=0.1849
+ throughput/total_tokens=273,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1426/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=273,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1427/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=273,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1428/500000]
+ train/ActionNoiseL2Loss=0.1515
+ throughput/total_tokens=274,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1429/500000]
+ train/ActionNoiseL2Loss=0.1605
+ throughput/total_tokens=274,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1430/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=274,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1431/500000]
+ train/ActionNoiseL2Loss=0.1408
+ throughput/total_tokens=274,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1432/500000]
+ train/ActionNoiseL2Loss=0.1365
+ throughput/total_tokens=274,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1433/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=275,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1434/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=275,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1435/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=275,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1436/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=275,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1437/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=275,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1438/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=276,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1439/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=276,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1440/500000]
+ optim/total_grad_norm=4.110
+ train/ActionNoiseL2Loss=0.1183
+ throughput/total_tokens=276,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1441/500000]
+ train/ActionNoiseL2Loss=0.1293
+ throughput/total_tokens=276,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1442/500000]
+ train/ActionNoiseL2Loss=0.1517
+ throughput/total_tokens=276,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1443/500000]
+ train/ActionNoiseL2Loss=0.1012
+ throughput/total_tokens=277,056,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1444/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=277,248,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1445/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=277,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1446/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=277,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1447/500000]
+ train/ActionNoiseL2Loss=0.1579
+ throughput/total_tokens=277,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1448/500000]
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=278,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1449/500000]
+ train/ActionNoiseL2Loss=0.1441
+ throughput/total_tokens=278,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1450/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=278,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1451/500000]
+ train/ActionNoiseL2Loss=0.1913
+ throughput/total_tokens=278,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1452/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=278,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1453/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=278,976,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1454/500000]
+ train/ActionNoiseL2Loss=0.2272
+ throughput/total_tokens=279,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1455/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=279,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1456/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=279,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1457/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=279,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1458/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=279,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1459/500000]
+ train/ActionNoiseL2Loss=0.1749
+ throughput/total_tokens=280,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1460/500000]
+ optim/total_grad_norm=5.146
+ train/ActionNoiseL2Loss=0.1623
+ throughput/total_tokens=280,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=1461/500000]
+ train/ActionNoiseL2Loss=0.1888
+ throughput/total_tokens=280,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1462/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=280,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1463/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=280,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1464/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=281,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1465/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=281,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1466/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=281,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1467/500000]
+ train/ActionNoiseL2Loss=0.1479
+ throughput/total_tokens=281,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1468/500000]
+ train/ActionNoiseL2Loss=0.1424
+ throughput/total_tokens=281,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1469/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=282,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1470/500000]
+ train/ActionNoiseL2Loss=0.1281
+ throughput/total_tokens=282,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1471/500000]
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=282,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1472/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=282,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1473/500000]
+ train/ActionNoiseL2Loss=0.1713
+ throughput/total_tokens=282,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1474/500000]
+ train/ActionNoiseL2Loss=0.1640
+ throughput/total_tokens=283,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1475/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=283,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1476/500000]
+ train/ActionNoiseL2Loss=0.1708
+ throughput/total_tokens=283,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1477/500000]
+ train/ActionNoiseL2Loss=0.1559
+ throughput/total_tokens=283,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1478/500000]
+ train/ActionNoiseL2Loss=0.1333
+ throughput/total_tokens=283,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1479/500000]
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=283,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1480/500000]
+ optim/total_grad_norm=3.211
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=284,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1481/500000]
+ train/ActionNoiseL2Loss=0.1362
+ throughput/total_tokens=284,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1482/500000]
+ train/ActionNoiseL2Loss=0.1596
+ throughput/total_tokens=284,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1483/500000]
+ train/ActionNoiseL2Loss=0.1372
+ throughput/total_tokens=284,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1484/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=284,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1485/500000]
+ train/ActionNoiseL2Loss=0.1315
+ throughput/total_tokens=285,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1486/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=285,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1487/500000]
+ train/ActionNoiseL2Loss=0.1441
+ throughput/total_tokens=285,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1488/500000]
+ train/ActionNoiseL2Loss=0.1486
+ throughput/total_tokens=285,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1489/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=285,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1490/500000]
+ train/ActionNoiseL2Loss=0.1379
+ throughput/total_tokens=286,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1491/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=286,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1492/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=286,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1493/500000]
+ train/ActionNoiseL2Loss=0.1648
+ throughput/total_tokens=286,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1494/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=286,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1495/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=287,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1496/500000]
+ train/ActionNoiseL2Loss=0.1656
+ throughput/total_tokens=287,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1497/500000]
+ train/ActionNoiseL2Loss=0.1507
+ throughput/total_tokens=287,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1498/500000]
+ train/ActionNoiseL2Loss=0.1587
+ throughput/total_tokens=287,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1499/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=287,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1500/500000]
+ optim/total_grad_norm=3.375
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=288,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+10/03 [01:29:20] INFO | >> Saving config... checkpoint.py:608
+10/03 [01:30:00] INFO | >> Saving model state... checkpoint.py:796
+10/03 [01:31:10] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [01:32:43] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=1501/500000]
+ train/ActionNoiseL2Loss=0.1038
+ throughput/total_tokens=288,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1502/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=288,384,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=1503/500000]
+ train/ActionNoiseL2Loss=0.2642
+ throughput/total_tokens=288,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=1504/500000]
+ train/ActionNoiseL2Loss=0.2599
+ throughput/total_tokens=288,768,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=1505/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=288,960,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=1506/500000]
+ train/ActionNoiseL2Loss=0.2406
+ throughput/total_tokens=289,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1507/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=289,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=1508/500000]
+ train/ActionNoiseL2Loss=0.1215
+ throughput/total_tokens=289,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1509/500000]
+ train/ActionNoiseL2Loss=0.1561
+ throughput/total_tokens=289,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1510/500000]
+ train/ActionNoiseL2Loss=0.1996
+ throughput/total_tokens=289,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=1511/500000]
+ train/ActionNoiseL2Loss=0.1354
+ throughput/total_tokens=290,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1512/500000]
+ train/ActionNoiseL2Loss=0.1481
+ throughput/total_tokens=290,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1513/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=290,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=1514/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=290,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1515/500000]
+ train/ActionNoiseL2Loss=0.1995
+ throughput/total_tokens=290,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1516/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=291,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1517/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=291,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1518/500000]
+ train/ActionNoiseL2Loss=0.1267
+ throughput/total_tokens=291,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1519/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=291,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1520/500000]
+ optim/total_grad_norm=2.594
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=291,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1521/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=292,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1522/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=292,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1523/500000]
+ train/ActionNoiseL2Loss=0.1360
+ throughput/total_tokens=292,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1524/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=292,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1525/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=292,800,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1526/500000]
+ train/ActionNoiseL2Loss=0.1622
+ throughput/total_tokens=292,992,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1527/500000]
+ train/ActionNoiseL2Loss=0.1306
+ throughput/total_tokens=293,184,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1528/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=293,376,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1529/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=293,568,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1530/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=293,760,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1531/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=293,952,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1532/500000]
+ train/ActionNoiseL2Loss=0.2032
+ throughput/total_tokens=294,144,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1533/500000]
+ train/ActionNoiseL2Loss=0.1332
+ throughput/total_tokens=294,336,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1534/500000]
+ train/ActionNoiseL2Loss=0.1164
+ throughput/total_tokens=294,528,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1535/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=294,720,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1536/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=294,912,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=1537/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=295,104,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1538/500000]
+ train/ActionNoiseL2Loss=0.1681
+ throughput/total_tokens=295,296,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=1539/500000]
+ train/ActionNoiseL2Loss=0.1391
+ throughput/total_tokens=295,488,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=1540/500000]
+ optim/total_grad_norm=2.132
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=295,680,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1541/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=295,872,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=1542/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=296,064,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=1543/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=296,256,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=1544/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=296,448,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=1545/500000]
+ train/ActionNoiseL2Loss=0.1170
+ throughput/total_tokens=296,640,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=1546/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=296,832,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=1547/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=297,024,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=1548/500000]
+ train/ActionNoiseL2Loss=0.1372
+ throughput/total_tokens=297,216,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=1549/500000]
+ train/ActionNoiseL2Loss=0.1341
+ throughput/total_tokens=297,408,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=1550/500000]
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=297,600,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1551/500000]
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=297,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1552/500000]
+ train/ActionNoiseL2Loss=0.1718
+ throughput/total_tokens=297,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1553/500000]
+ train/ActionNoiseL2Loss=0.1134
+ throughput/total_tokens=298,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1554/500000]
+ train/ActionNoiseL2Loss=0.1657
+ throughput/total_tokens=298,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1555/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=298,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1556/500000]
+ train/ActionNoiseL2Loss=0.1465
+ throughput/total_tokens=298,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1557/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=298,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1558/500000]
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=299,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1559/500000]
+ train/ActionNoiseL2Loss=0.1354
+ throughput/total_tokens=299,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1560/500000]
+ optim/total_grad_norm=3.102
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=299,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=1561/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=299,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1562/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=299,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1563/500000]
+ train/ActionNoiseL2Loss=0.1185
+ throughput/total_tokens=300,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1564/500000]
+ train/ActionNoiseL2Loss=0.1446
+ throughput/total_tokens=300,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1565/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=300,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1566/500000]
+ train/ActionNoiseL2Loss=0.1678
+ throughput/total_tokens=300,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1567/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=300,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1568/500000]
+ train/ActionNoiseL2Loss=0.1114
+ throughput/total_tokens=301,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1569/500000]
+ train/ActionNoiseL2Loss=0.1548
+ throughput/total_tokens=301,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1570/500000]
+ train/ActionNoiseL2Loss=0.1519
+ throughput/total_tokens=301,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1571/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=301,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1572/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=301,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1573/500000]
+ train/ActionNoiseL2Loss=0.1218
+ throughput/total_tokens=302,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1574/500000]
+ train/ActionNoiseL2Loss=0.1760
+ throughput/total_tokens=302,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1575/500000]
+ train/ActionNoiseL2Loss=0.2964
+ throughput/total_tokens=302,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1576/500000]
+ train/ActionNoiseL2Loss=0.1773
+ throughput/total_tokens=302,592,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1577/500000]
+ train/ActionNoiseL2Loss=0.2033
+ throughput/total_tokens=302,784,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1578/500000]
+ train/ActionNoiseL2Loss=0.1553
+ throughput/total_tokens=302,976,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1579/500000]
+ train/ActionNoiseL2Loss=0.1716
+ throughput/total_tokens=303,168,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1580/500000]
+ optim/total_grad_norm=3.993
+ train/ActionNoiseL2Loss=0.1955
+ throughput/total_tokens=303,360,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1581/500000]
+ train/ActionNoiseL2Loss=0.1366
+ throughput/total_tokens=303,552,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1582/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=303,744,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1583/500000]
+ train/ActionNoiseL2Loss=0.1674
+ throughput/total_tokens=303,936,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1584/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=304,128,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1585/500000]
+ train/ActionNoiseL2Loss=0.1414
+ throughput/total_tokens=304,320,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1586/500000]
+ train/ActionNoiseL2Loss=0.1538
+ throughput/total_tokens=304,512,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1587/500000]
+ train/ActionNoiseL2Loss=0.1489
+ throughput/total_tokens=304,704,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1588/500000]
+ train/ActionNoiseL2Loss=0.1270
+ throughput/total_tokens=304,896,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1589/500000]
+ train/ActionNoiseL2Loss=0.1642
+ throughput/total_tokens=305,088,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1590/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=305,280,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1591/500000]
+ train/ActionNoiseL2Loss=0.1366
+ throughput/total_tokens=305,472,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1592/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=305,664,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1593/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=305,856,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1594/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=306,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1595/500000]
+ train/ActionNoiseL2Loss=0.1245
+ throughput/total_tokens=306,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1596/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=306,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1597/500000]
+ train/ActionNoiseL2Loss=0.1349
+ throughput/total_tokens=306,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1598/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=306,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1599/500000]
+ train/ActionNoiseL2Loss=0.1843
+ throughput/total_tokens=307,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1600/500000]
+ optim/total_grad_norm=3.441
+ train/ActionNoiseL2Loss=0.1272
+ throughput/total_tokens=307,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1601/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=307,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1602/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=307,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1603/500000]
+ train/ActionNoiseL2Loss=0.1505
+ throughput/total_tokens=307,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1604/500000]
+ train/ActionNoiseL2Loss=0.1020
+ throughput/total_tokens=307,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1605/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=308,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1606/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=308,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1607/500000]
+ train/ActionNoiseL2Loss=0.0959
+ throughput/total_tokens=308,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1608/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=308,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1609/500000]
+ train/ActionNoiseL2Loss=0.1337
+ throughput/total_tokens=308,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1610/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=309,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=1611/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=309,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1612/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=309,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1613/500000]
+ train/ActionNoiseL2Loss=0.1330
+ throughput/total_tokens=309,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1614/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=309,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1615/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=310,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1616/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=310,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1617/500000]
+ train/ActionNoiseL2Loss=0.1052
+ throughput/total_tokens=310,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1618/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=310,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1619/500000]
+ train/ActionNoiseL2Loss=0.0956
+ throughput/total_tokens=310,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1620/500000]
+ optim/total_grad_norm=2.440
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=311,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1621/500000]
+ train/ActionNoiseL2Loss=0.1396
+ throughput/total_tokens=311,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1622/500000]
+ train/ActionNoiseL2Loss=0.1254
+ throughput/total_tokens=311,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1623/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=311,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1624/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=311,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1625/500000]
+ train/ActionNoiseL2Loss=0.1478
+ throughput/total_tokens=312,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1626/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=312,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1627/500000]
+ train/ActionNoiseL2Loss=0.1190
+ throughput/total_tokens=312,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1628/500000]
+ train/ActionNoiseL2Loss=0.1941
+ throughput/total_tokens=312,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1629/500000]
+ train/ActionNoiseL2Loss=0.0961
+ throughput/total_tokens=312,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1630/500000]
+ train/ActionNoiseL2Loss=0.1315
+ throughput/total_tokens=312,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1631/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=313,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1632/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=313,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1633/500000]
+ train/ActionNoiseL2Loss=0.1359
+ throughput/total_tokens=313,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1634/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=313,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1635/500000]
+ train/ActionNoiseL2Loss=0.1432
+ throughput/total_tokens=313,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1636/500000]
+ train/ActionNoiseL2Loss=0.1935
+ throughput/total_tokens=314,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1637/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=314,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1638/500000]
+ train/ActionNoiseL2Loss=0.2375
+ throughput/total_tokens=314,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1639/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=314,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1640/500000]
+ optim/total_grad_norm=3.574
+ train/ActionNoiseL2Loss=0.1376
+ throughput/total_tokens=314,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1641/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=315,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1642/500000]
+ train/ActionNoiseL2Loss=0.1821
+ throughput/total_tokens=315,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1643/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=315,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1644/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=315,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1645/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=315,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1646/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=316,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1647/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=316,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1648/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=316,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1649/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=316,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1650/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=316,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1651/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=316,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1652/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=317,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1653/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=317,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1654/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=317,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1655/500000]
+ train/ActionNoiseL2Loss=0.1134
+ throughput/total_tokens=317,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1656/500000]
+ train/ActionNoiseL2Loss=0.1930
+ throughput/total_tokens=317,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1657/500000]
+ train/ActionNoiseL2Loss=0.1362
+ throughput/total_tokens=318,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1658/500000]
+ train/ActionNoiseL2Loss=0.1289
+ throughput/total_tokens=318,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1659/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=318,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1660/500000]
+ optim/total_grad_norm=2.512
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=318,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=1661/500000]
+ train/ActionNoiseL2Loss=0.1922
+ throughput/total_tokens=318,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1662/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=319,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1663/500000]
+ train/ActionNoiseL2Loss=0.1769
+ throughput/total_tokens=319,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1664/500000]
+ train/ActionNoiseL2Loss=0.1829
+ throughput/total_tokens=319,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1665/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=319,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1666/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=319,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1667/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=320,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1668/500000]
+ train/ActionNoiseL2Loss=0.1822
+ throughput/total_tokens=320,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1669/500000]
+ train/ActionNoiseL2Loss=0.1099
+ throughput/total_tokens=320,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1670/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=320,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1671/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=320,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1672/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=321,024,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1673/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=321,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1674/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=321,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1675/500000]
+ train/ActionNoiseL2Loss=0.1474
+ throughput/total_tokens=321,600,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1676/500000]
+ train/ActionNoiseL2Loss=0.1540
+ throughput/total_tokens=321,792,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1677/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=321,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1678/500000]
+ train/ActionNoiseL2Loss=0.1340
+ throughput/total_tokens=322,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1679/500000]
+ train/ActionNoiseL2Loss=0.1606
+ throughput/total_tokens=322,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1680/500000]
+ optim/total_grad_norm=3.393
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=322,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1681/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=322,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1682/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=322,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1683/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=323,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1684/500000]
+ train/ActionNoiseL2Loss=0.1412
+ throughput/total_tokens=323,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1685/500000]
+ train/ActionNoiseL2Loss=0.1470
+ throughput/total_tokens=323,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1686/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=323,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1687/500000]
+ train/ActionNoiseL2Loss=0.1393
+ throughput/total_tokens=323,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1688/500000]
+ train/ActionNoiseL2Loss=0.1288
+ throughput/total_tokens=324,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1689/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=324,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1690/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=324,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1691/500000]
+ train/ActionNoiseL2Loss=0.1020
+ throughput/total_tokens=324,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1692/500000]
+ train/ActionNoiseL2Loss=0.1316
+ throughput/total_tokens=324,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1693/500000]
+ train/ActionNoiseL2Loss=0.1717
+ throughput/total_tokens=325,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1694/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=325,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1695/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=325,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1696/500000]
+ train/ActionNoiseL2Loss=0.1317
+ throughput/total_tokens=325,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1697/500000]
+ train/ActionNoiseL2Loss=0.1318
+ throughput/total_tokens=325,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1698/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=326,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1699/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=326,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1700/500000]
+ optim/total_grad_norm=4.113
+ train/ActionNoiseL2Loss=0.1394
+ throughput/total_tokens=326,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1701/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=326,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1702/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=326,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1703/500000]
+ train/ActionNoiseL2Loss=0.1257
+ throughput/total_tokens=326,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1704/500000]
+ train/ActionNoiseL2Loss=0.1827
+ throughput/total_tokens=327,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1705/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=327,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1706/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=327,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1707/500000]
+ train/ActionNoiseL2Loss=0.1478
+ throughput/total_tokens=327,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1708/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=327,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1709/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=328,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1710/500000]
+ train/ActionNoiseL2Loss=0.1236
+ throughput/total_tokens=328,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=1711/500000]
+ train/ActionNoiseL2Loss=0.1356
+ throughput/total_tokens=328,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1712/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=328,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1713/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=328,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1714/500000]
+ train/ActionNoiseL2Loss=0.2482
+ throughput/total_tokens=329,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1715/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=329,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1716/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=329,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1717/500000]
+ train/ActionNoiseL2Loss=0.1364
+ throughput/total_tokens=329,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1718/500000]
+ train/ActionNoiseL2Loss=0.1337
+ throughput/total_tokens=329,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1719/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=330,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1720/500000]
+ optim/total_grad_norm=4.323
+ train/ActionNoiseL2Loss=0.1645
+ throughput/total_tokens=330,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1721/500000]
+ train/ActionNoiseL2Loss=0.1426
+ throughput/total_tokens=330,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1722/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=330,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1723/500000]
+ train/ActionNoiseL2Loss=0.1223
+ throughput/total_tokens=330,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1724/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=331,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1725/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=331,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1726/500000]
+ train/ActionNoiseL2Loss=0.1037
+ throughput/total_tokens=331,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1727/500000]
+ train/ActionNoiseL2Loss=0.1435
+ throughput/total_tokens=331,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1728/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=331,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1729/500000]
+ train/ActionNoiseL2Loss=0.1302
+ throughput/total_tokens=331,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1730/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=332,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1731/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=332,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1732/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=332,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1733/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=332,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1734/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=332,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1735/500000]
+ train/ActionNoiseL2Loss=0.1265
+ throughput/total_tokens=333,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1736/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=333,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1737/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=333,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1738/500000]
+ train/ActionNoiseL2Loss=0.1222
+ throughput/total_tokens=333,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1739/500000]
+ train/ActionNoiseL2Loss=0.1226
+ throughput/total_tokens=333,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1740/500000]
+ optim/total_grad_norm=2.185
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=334,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1741/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=334,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1742/500000]
+ train/ActionNoiseL2Loss=0.1310
+ throughput/total_tokens=334,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1743/500000]
+ train/ActionNoiseL2Loss=0.1357
+ throughput/total_tokens=334,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1744/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=334,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1745/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=335,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1746/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=335,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1747/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=335,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1748/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=335,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1749/500000]
+ train/ActionNoiseL2Loss=0.1186
+ throughput/total_tokens=335,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1750/500000]
+ train/ActionNoiseL2Loss=0.1860
+ throughput/total_tokens=336,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1751/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=336,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1752/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=336,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1753/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=336,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1754/500000]
+ train/ActionNoiseL2Loss=0.1743
+ throughput/total_tokens=336,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1755/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=336,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1756/500000]
+ train/ActionNoiseL2Loss=0.1514
+ throughput/total_tokens=337,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1757/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=337,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1758/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=337,536,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1759/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=337,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1760/500000]
+ optim/total_grad_norm=2.098
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=337,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=1761/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=338,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1762/500000]
+ train/ActionNoiseL2Loss=0.1286
+ throughput/total_tokens=338,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1763/500000]
+ train/ActionNoiseL2Loss=0.1688
+ throughput/total_tokens=338,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1764/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=338,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1765/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=338,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1766/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=339,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1767/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=339,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1768/500000]
+ train/ActionNoiseL2Loss=0.1492
+ throughput/total_tokens=339,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1769/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=339,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1770/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=339,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1771/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=340,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1772/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=340,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1773/500000]
+ train/ActionNoiseL2Loss=0.2150
+ throughput/total_tokens=340,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1774/500000]
+ train/ActionNoiseL2Loss=0.1636
+ throughput/total_tokens=340,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1775/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=340,800,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1776/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=340,992,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1777/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=341,184,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1778/500000]
+ train/ActionNoiseL2Loss=0.1706
+ throughput/total_tokens=341,376,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1779/500000]
+ train/ActionNoiseL2Loss=0.1810
+ throughput/total_tokens=341,568,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1780/500000]
+ optim/total_grad_norm=2.918
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=341,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1781/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=341,952,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1782/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=342,144,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1783/500000]
+ train/ActionNoiseL2Loss=0.1684
+ throughput/total_tokens=342,336,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1784/500000]
+ train/ActionNoiseL2Loss=0.1171
+ throughput/total_tokens=342,528,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1785/500000]
+ train/ActionNoiseL2Loss=0.2107
+ throughput/total_tokens=342,720,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1786/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=342,912,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1787/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=343,104,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1788/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=343,296,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1789/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=343,488,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1790/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=343,680,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1791/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=343,872,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1792/500000]
+ train/ActionNoiseL2Loss=0.1099
+ throughput/total_tokens=344,064,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1793/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=344,256,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1794/500000]
+ train/ActionNoiseL2Loss=0.1235
+ throughput/total_tokens=344,448,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1795/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=344,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1796/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=344,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1797/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=345,024,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1798/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=345,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1799/500000]
+ train/ActionNoiseL2Loss=0.1054
+ throughput/total_tokens=345,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1800/500000]
+ optim/total_grad_norm=2.829
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=345,600,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1801/500000]
+ train/ActionNoiseL2Loss=0.1248
+ throughput/total_tokens=345,792,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1802/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=345,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1803/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=346,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1804/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=346,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1805/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=346,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1806/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=346,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1807/500000]
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=346,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1808/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=347,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1809/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=347,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1810/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=347,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=1811/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=347,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1812/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=347,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1813/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=348,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1814/500000]
+ train/ActionNoiseL2Loss=0.1675
+ throughput/total_tokens=348,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1815/500000]
+ train/ActionNoiseL2Loss=0.1625
+ throughput/total_tokens=348,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1816/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=348,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1817/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=348,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1818/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=349,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1819/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=349,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1820/500000]
+ optim/total_grad_norm=4.416
+ train/ActionNoiseL2Loss=0.1793
+ throughput/total_tokens=349,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1821/500000]
+ train/ActionNoiseL2Loss=0.2030
+ throughput/total_tokens=349,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1822/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=349,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1823/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=350,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1824/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=350,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1825/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=350,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1826/500000]
+ train/ActionNoiseL2Loss=0.2122
+ throughput/total_tokens=350,592,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1827/500000]
+ train/ActionNoiseL2Loss=0.1416
+ throughput/total_tokens=350,784,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1828/500000]
+ train/ActionNoiseL2Loss=0.1154
+ throughput/total_tokens=350,976,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1829/500000]
+ train/ActionNoiseL2Loss=0.1229
+ throughput/total_tokens=351,168,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1830/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=351,360,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1831/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=351,552,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1832/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=351,744,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1833/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=351,936,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1834/500000]
+ train/ActionNoiseL2Loss=0.1464
+ throughput/total_tokens=352,128,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1835/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=352,320,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1836/500000]
+ train/ActionNoiseL2Loss=0.1391
+ throughput/total_tokens=352,512,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1837/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=352,704,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1838/500000]
+ train/ActionNoiseL2Loss=0.1212
+ throughput/total_tokens=352,896,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1839/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=353,088,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1840/500000]
+ optim/total_grad_norm=3.171
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=353,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1841/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=353,472,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1842/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=353,664,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1843/500000]
+ train/ActionNoiseL2Loss=0.1164
+ throughput/total_tokens=353,856,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1844/500000]
+ train/ActionNoiseL2Loss=0.1866
+ throughput/total_tokens=354,048,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1845/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=354,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1846/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=354,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1847/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=354,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1848/500000]
+ train/ActionNoiseL2Loss=0.1088
+ throughput/total_tokens=354,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1849/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=355,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1850/500000]
+ train/ActionNoiseL2Loss=0.1309
+ throughput/total_tokens=355,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1851/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=355,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1852/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=355,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1853/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=355,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1854/500000]
+ train/ActionNoiseL2Loss=0.1149
+ throughput/total_tokens=355,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1855/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=356,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1856/500000]
+ train/ActionNoiseL2Loss=0.1202
+ throughput/total_tokens=356,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1857/500000]
+ train/ActionNoiseL2Loss=0.1421
+ throughput/total_tokens=356,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1858/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=356,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1859/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=356,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1860/500000]
+ optim/total_grad_norm=7.171
+ train/ActionNoiseL2Loss=0.1911
+ throughput/total_tokens=357,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=1861/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=357,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1862/500000]
+ train/ActionNoiseL2Loss=0.1167
+ throughput/total_tokens=357,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1863/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=357,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1864/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=357,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1865/500000]
+ train/ActionNoiseL2Loss=0.1433
+ throughput/total_tokens=358,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1866/500000]
+ train/ActionNoiseL2Loss=0.1375
+ throughput/total_tokens=358,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1867/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=358,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1868/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=358,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1869/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=358,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1870/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=359,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1871/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=359,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1872/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=359,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1873/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=359,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1874/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=359,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1875/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=360,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1876/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=360,192,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1877/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=360,384,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1878/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=360,576,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1879/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=360,768,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1880/500000]
+ optim/total_grad_norm=1.750
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=360,960,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1881/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=361,152,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1882/500000]
+ train/ActionNoiseL2Loss=0.1333
+ throughput/total_tokens=361,344,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1883/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=361,536,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1884/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=361,728,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1885/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=361,920,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1886/500000]
+ train/ActionNoiseL2Loss=0.1680
+ throughput/total_tokens=362,112,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1887/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=362,304,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1888/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=362,496,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1889/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=362,688,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1890/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=362,880,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1891/500000]
+ train/ActionNoiseL2Loss=0.2151
+ throughput/total_tokens=363,072,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1892/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=363,264,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1893/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=363,456,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1894/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=363,648,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1895/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=363,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1896/500000]
+ train/ActionNoiseL2Loss=0.1681
+ throughput/total_tokens=364,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1897/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=364,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1898/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=364,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1899/500000]
+ train/ActionNoiseL2Loss=0.1620
+ throughput/total_tokens=364,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1900/500000]
+ optim/total_grad_norm=2.187
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=364,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1901/500000]
+ train/ActionNoiseL2Loss=0.2503
+ throughput/total_tokens=364,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1902/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=365,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1903/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=365,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1904/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=365,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1905/500000]
+ train/ActionNoiseL2Loss=0.1443
+ throughput/total_tokens=365,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1906/500000]
+ train/ActionNoiseL2Loss=0.1267
+ throughput/total_tokens=365,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1907/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=366,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1908/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=366,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1909/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=366,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1910/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=366,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=1911/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=366,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1912/500000]
+ train/ActionNoiseL2Loss=0.1379
+ throughput/total_tokens=367,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1913/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=367,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1914/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=367,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1915/500000]
+ train/ActionNoiseL2Loss=0.1349
+ throughput/total_tokens=367,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1916/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=367,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1917/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=368,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1918/500000]
+ train/ActionNoiseL2Loss=0.1148
+ throughput/total_tokens=368,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1919/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=368,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1920/500000]
+ optim/total_grad_norm=3.689
+ train/ActionNoiseL2Loss=0.1264
+ throughput/total_tokens=368,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1921/500000]
+ train/ActionNoiseL2Loss=0.1525
+ throughput/total_tokens=368,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1922/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=369,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1923/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=369,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1924/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=369,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1925/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=369,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1926/500000]
+ train/ActionNoiseL2Loss=0.1480
+ throughput/total_tokens=369,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1927/500000]
+ train/ActionNoiseL2Loss=0.1757
+ throughput/total_tokens=369,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1928/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=370,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1929/500000]
+ train/ActionNoiseL2Loss=0.1193
+ throughput/total_tokens=370,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1930/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=370,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1931/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=370,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1932/500000]
+ train/ActionNoiseL2Loss=0.1226
+ throughput/total_tokens=370,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1933/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=371,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1934/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=371,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1935/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=371,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1936/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=371,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1937/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=371,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1938/500000]
+ train/ActionNoiseL2Loss=0.1315
+ throughput/total_tokens=372,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1939/500000]
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=372,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1940/500000]
+ optim/total_grad_norm=3.368
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=372,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1941/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=372,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1942/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=372,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1943/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=373,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1944/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=373,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1945/500000]
+ train/ActionNoiseL2Loss=0.1394
+ throughput/total_tokens=373,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1946/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=373,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1947/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=373,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1948/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=374,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1949/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=374,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=1950/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=374,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1951/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=374,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1952/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=374,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1953/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=374,976,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1954/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=375,168,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1955/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=375,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1956/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=375,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1957/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=375,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1958/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=375,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1959/500000]
+ train/ActionNoiseL2Loss=0.1382
+ throughput/total_tokens=376,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1960/500000]
+ optim/total_grad_norm=3.238
+ train/ActionNoiseL2Loss=0.1154
+ throughput/total_tokens=376,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=1961/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=376,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1962/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=376,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1963/500000]
+ train/ActionNoiseL2Loss=0.1405
+ throughput/total_tokens=376,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1964/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=377,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1965/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=377,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1966/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=377,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1967/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=377,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1968/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=377,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1969/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=378,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1970/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=378,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1971/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=378,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1972/500000]
+ train/ActionNoiseL2Loss=0.2121
+ throughput/total_tokens=378,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1973/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=378,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1974/500000]
+ train/ActionNoiseL2Loss=0.2441
+ throughput/total_tokens=379,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1975/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=379,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1976/500000]
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=379,392,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1977/500000]
+ train/ActionNoiseL2Loss=0.1290
+ throughput/total_tokens=379,584,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1978/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=379,776,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1979/500000]
+ train/ActionNoiseL2Loss=0.1281
+ throughput/total_tokens=379,968,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1980/500000]
+ optim/total_grad_norm=2.117
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=380,160,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1981/500000]
+ train/ActionNoiseL2Loss=0.1276
+ throughput/total_tokens=380,352,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1982/500000]
+ train/ActionNoiseL2Loss=0.1276
+ throughput/total_tokens=380,544,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1983/500000]
+ train/ActionNoiseL2Loss=0.1151
+ throughput/total_tokens=380,736,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1984/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=380,928,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1985/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=381,120,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1986/500000]
+ train/ActionNoiseL2Loss=0.1410
+ throughput/total_tokens=381,312,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1987/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=381,504,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1988/500000]
+ train/ActionNoiseL2Loss=0.1293
+ throughput/total_tokens=381,696,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1989/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=381,888,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1990/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=382,080,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=1991/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=382,272,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1992/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=382,464,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1993/500000]
+ train/ActionNoiseL2Loss=0.1137
+ throughput/total_tokens=382,656,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1994/500000]
+ train/ActionNoiseL2Loss=0.1598
+ throughput/total_tokens=382,848,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1995/500000]
+ train/ActionNoiseL2Loss=0.1508
+ throughput/total_tokens=383,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1996/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=383,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1997/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=383,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1998/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=383,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=1999/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=383,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2000/500000]
+ optim/total_grad_norm=2.277
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=384,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+10/03 [04:27:24] INFO | >> Saving config... checkpoint.py:608
+10/03 [04:28:01] INFO | >> Saving model state... checkpoint.py:796
+10/03 [04:29:12] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [04:30:37] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=2001/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=384,192,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=2002/500000]
+ train/ActionNoiseL2Loss=0.1249
+ throughput/total_tokens=384,384,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=2003/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=384,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=2004/500000]
+ train/ActionNoiseL2Loss=0.1195
+ throughput/total_tokens=384,768,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2005/500000]
+ train/ActionNoiseL2Loss=0.1441
+ throughput/total_tokens=384,960,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2006/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=385,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2007/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=385,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2008/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=385,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2009/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=385,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2010/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=385,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2011/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=386,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2012/500000]
+ train/ActionNoiseL2Loss=0.1847
+ throughput/total_tokens=386,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2013/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=386,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2014/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=386,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2015/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=386,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2016/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=387,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2017/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=387,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2018/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=387,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2019/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=387,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2020/500000]
+ optim/total_grad_norm=3.337
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=387,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2021/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=388,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2022/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=388,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2023/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=388,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2024/500000]
+ train/ActionNoiseL2Loss=0.1377
+ throughput/total_tokens=388,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2025/500000]
+ train/ActionNoiseL2Loss=0.1369
+ throughput/total_tokens=388,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2026/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=388,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2027/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=389,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2028/500000]
+ train/ActionNoiseL2Loss=0.1112
+ throughput/total_tokens=389,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2029/500000]
+ train/ActionNoiseL2Loss=0.1500
+ throughput/total_tokens=389,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2030/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=389,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2031/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=389,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2032/500000]
+ train/ActionNoiseL2Loss=0.0956
+ throughput/total_tokens=390,144,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2033/500000]
+ train/ActionNoiseL2Loss=0.1451
+ throughput/total_tokens=390,336,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2034/500000]
+ train/ActionNoiseL2Loss=0.2378
+ throughput/total_tokens=390,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2035/500000]
+ train/ActionNoiseL2Loss=0.1318
+ throughput/total_tokens=390,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2036/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=390,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2037/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=391,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2038/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=391,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2039/500000]
+ train/ActionNoiseL2Loss=0.1546
+ throughput/total_tokens=391,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2040/500000]
+ optim/total_grad_norm=4.087
+ train/ActionNoiseL2Loss=0.1935
+ throughput/total_tokens=391,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2041/500000]
+ train/ActionNoiseL2Loss=0.1333
+ throughput/total_tokens=391,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2042/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=392,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2043/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=392,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2044/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=392,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2045/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=392,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2046/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=392,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2047/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=393,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2048/500000]
+ train/ActionNoiseL2Loss=0.1465
+ throughput/total_tokens=393,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2049/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=393,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2050/500000]
+ train/ActionNoiseL2Loss=0.1148
+ throughput/total_tokens=393,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2051/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=393,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2052/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=393,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2053/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=394,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2054/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=394,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2055/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=394,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2056/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=394,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2057/500000]
+ train/ActionNoiseL2Loss=0.1531
+ throughput/total_tokens=394,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2058/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=395,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2059/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=395,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2060/500000]
+ optim/total_grad_norm=3.059
+ train/ActionNoiseL2Loss=0.1150
+ throughput/total_tokens=395,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=2061/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=395,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2062/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=395,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2063/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=396,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2064/500000]
+ train/ActionNoiseL2Loss=0.1307
+ throughput/total_tokens=396,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2065/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=396,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2066/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=396,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2067/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=396,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=2068/500000]
+ train/ActionNoiseL2Loss=0.1518
+ throughput/total_tokens=397,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=2069/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=397,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=2070/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=397,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2071/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=397,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2072/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=397,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2073/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=398,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2074/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=398,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2075/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=398,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2076/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=398,592,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2077/500000]
+ train/ActionNoiseL2Loss=0.1196
+ throughput/total_tokens=398,784,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2078/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=398,976,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2079/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=399,168,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2080/500000]
+ optim/total_grad_norm=1.504
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=399,360,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2081/500000]
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=399,552,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2082/500000]
+ train/ActionNoiseL2Loss=0.1691
+ throughput/total_tokens=399,744,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2083/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=399,936,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2084/500000]
+ train/ActionNoiseL2Loss=0.1104
+ throughput/total_tokens=400,128,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2085/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=400,320,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2086/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=400,512,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2087/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=400,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2088/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=400,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2089/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=401,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2090/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=401,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2091/500000]
+ train/ActionNoiseL2Loss=0.1132
+ throughput/total_tokens=401,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2092/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=401,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2093/500000]
+ train/ActionNoiseL2Loss=0.1516
+ throughput/total_tokens=401,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2094/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=402,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2095/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=402,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2096/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=402,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2097/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=402,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2098/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=402,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2099/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=403,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2100/500000]
+ optim/total_grad_norm=1.096
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=403,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2101/500000]
+ train/ActionNoiseL2Loss=0.1557
+ throughput/total_tokens=403,392,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2102/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=403,584,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2103/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=403,776,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2104/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=403,968,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2105/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=404,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2106/500000]
+ train/ActionNoiseL2Loss=0.1162
+ throughput/total_tokens=404,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2107/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=404,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2108/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=404,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2109/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=404,928,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2110/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=405,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=2111/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=405,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2112/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=405,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2113/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=405,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2114/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=405,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2115/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=406,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2116/500000]
+ train/ActionNoiseL2Loss=0.1658
+ throughput/total_tokens=406,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2117/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=406,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2118/500000]
+ train/ActionNoiseL2Loss=0.1640
+ throughput/total_tokens=406,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2119/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=406,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2120/500000]
+ optim/total_grad_norm=2.151
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=407,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2121/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=407,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2122/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=407,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2123/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=407,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2124/500000]
+ train/ActionNoiseL2Loss=0.1199
+ throughput/total_tokens=407,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2125/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=408,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2126/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=408,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2127/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=408,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2128/500000]
+ train/ActionNoiseL2Loss=0.1300
+ throughput/total_tokens=408,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2129/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=408,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2130/500000]
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=408,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2131/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=409,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2132/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=409,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2133/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=409,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2134/500000]
+ train/ActionNoiseL2Loss=0.2774
+ throughput/total_tokens=409,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2135/500000]
+ train/ActionNoiseL2Loss=0.2113
+ throughput/total_tokens=409,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2136/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=410,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2137/500000]
+ train/ActionNoiseL2Loss=0.1660
+ throughput/total_tokens=410,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2138/500000]
+ train/ActionNoiseL2Loss=0.1594
+ throughput/total_tokens=410,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2139/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=410,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2140/500000]
+ optim/total_grad_norm=1.996
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=410,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2141/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=411,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2142/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=411,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2143/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=411,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2144/500000]
+ train/ActionNoiseL2Loss=0.1086
+ throughput/total_tokens=411,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2145/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=411,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2146/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=412,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2147/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=412,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2148/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=412,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2149/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=412,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2150/500000]
+ train/ActionNoiseL2Loss=0.2511
+ throughput/total_tokens=412,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2151/500000]
+ train/ActionNoiseL2Loss=0.1251
+ throughput/total_tokens=412,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2152/500000]
+ train/ActionNoiseL2Loss=0.1201
+ throughput/total_tokens=413,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2153/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=413,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2154/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=413,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2155/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=413,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2156/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=413,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2157/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=414,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2158/500000]
+ train/ActionNoiseL2Loss=0.1117
+ throughput/total_tokens=414,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2159/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=414,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2160/500000]
+ optim/total_grad_norm=3.582
+ train/ActionNoiseL2Loss=0.1377
+ throughput/total_tokens=414,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=2161/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=414,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2162/500000]
+ train/ActionNoiseL2Loss=0.1477
+ throughput/total_tokens=415,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2163/500000]
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=415,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2164/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=415,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2165/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=415,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2166/500000]
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=415,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2167/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=416,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2168/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=416,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2169/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=416,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2170/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=416,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2171/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=416,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2172/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=417,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2173/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=417,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2174/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=417,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2175/500000]
+ train/ActionNoiseL2Loss=0.1350
+ throughput/total_tokens=417,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2176/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=417,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2177/500000]
+ train/ActionNoiseL2Loss=0.2034
+ throughput/total_tokens=417,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2178/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=418,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2179/500000]
+ train/ActionNoiseL2Loss=0.1927
+ throughput/total_tokens=418,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2180/500000]
+ optim/total_grad_norm=2.696
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=418,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2181/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=418,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2182/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=418,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2183/500000]
+ train/ActionNoiseL2Loss=0.1278
+ throughput/total_tokens=419,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2184/500000]
+ train/ActionNoiseL2Loss=0.1286
+ throughput/total_tokens=419,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2185/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=419,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2186/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=419,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2187/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=419,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2188/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=420,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2189/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=420,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2190/500000]
+ train/ActionNoiseL2Loss=0.1366
+ throughput/total_tokens=420,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2191/500000]
+ train/ActionNoiseL2Loss=0.1285
+ throughput/total_tokens=420,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2192/500000]
+ train/ActionNoiseL2Loss=0.1808
+ throughput/total_tokens=420,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2193/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=421,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2194/500000]
+ train/ActionNoiseL2Loss=0.1757
+ throughput/total_tokens=421,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2195/500000]
+ train/ActionNoiseL2Loss=0.1054
+ throughput/total_tokens=421,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2196/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=421,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2197/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=421,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2198/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=422,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2199/500000]
+ train/ActionNoiseL2Loss=0.1222
+ throughput/total_tokens=422,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2200/500000]
+ optim/total_grad_norm=2.609
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=422,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2201/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=422,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2202/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=422,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2203/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=422,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2204/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=423,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2205/500000]
+ train/ActionNoiseL2Loss=0.1520
+ throughput/total_tokens=423,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2206/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=423,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2207/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=423,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2208/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=423,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2209/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=424,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2210/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=424,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=2211/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=424,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2212/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=424,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2213/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=424,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2214/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=425,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2215/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=425,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2216/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=425,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2217/500000]
+ train/ActionNoiseL2Loss=0.1462
+ throughput/total_tokens=425,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2218/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=425,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2219/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=426,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2220/500000]
+ optim/total_grad_norm=2.610
+ train/ActionNoiseL2Loss=0.1174
+ throughput/total_tokens=426,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2221/500000]
+ train/ActionNoiseL2Loss=0.1307
+ throughput/total_tokens=426,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2222/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=426,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2223/500000]
+ train/ActionNoiseL2Loss=0.1850
+ throughput/total_tokens=426,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2224/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=427,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2225/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=427,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2226/500000]
+ train/ActionNoiseL2Loss=0.1396
+ throughput/total_tokens=427,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2227/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=427,584,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2228/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=427,776,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2229/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=427,968,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2230/500000]
+ train/ActionNoiseL2Loss=0.1335
+ throughput/total_tokens=428,160,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2231/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=428,352,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2232/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=428,544,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2233/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=428,736,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2234/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=428,928,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2235/500000]
+ train/ActionNoiseL2Loss=0.1476
+ throughput/total_tokens=429,120,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2236/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=429,312,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2237/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=429,504,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2238/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=429,696,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2239/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=429,888,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2240/500000]
+ optim/total_grad_norm=2.616
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=430,080,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2241/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=430,272,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2242/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=430,464,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2243/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=430,656,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2244/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=430,848,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2245/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=431,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2246/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=431,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2247/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=431,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2248/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=431,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2249/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=431,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2250/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=432,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2251/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=432,192,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2252/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=432,384,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2253/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=432,576,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2254/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=432,768,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2255/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=432,960,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2256/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=433,152,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2257/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=433,344,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2258/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=433,536,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2259/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=433,728,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2260/500000]
+ optim/total_grad_norm=2.216
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=433,920,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=2261/500000]
+ train/ActionNoiseL2Loss=0.1686
+ throughput/total_tokens=434,112,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2262/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=434,304,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2263/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=434,496,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2264/500000]
+ train/ActionNoiseL2Loss=0.1550
+ throughput/total_tokens=434,688,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2265/500000]
+ train/ActionNoiseL2Loss=0.1246
+ throughput/total_tokens=434,880,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2266/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=435,072,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2267/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=435,264,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2268/500000]
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=435,456,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2269/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=435,648,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2270/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=435,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2271/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=436,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2272/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=436,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2273/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=436,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2274/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=436,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2275/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=436,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2276/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=436,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2277/500000]
+ train/ActionNoiseL2Loss=0.1132
+ throughput/total_tokens=437,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2278/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=437,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2279/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=437,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2280/500000]
+ optim/total_grad_norm=1.746
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=437,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2281/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=437,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2282/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=438,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2283/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=438,336,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2284/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=438,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2285/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=438,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2286/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=438,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2287/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=439,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2288/500000]
+ train/ActionNoiseL2Loss=0.1110
+ throughput/total_tokens=439,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2289/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=439,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2290/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=439,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2291/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=439,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2292/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=440,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2293/500000]
+ train/ActionNoiseL2Loss=0.1012
+ throughput/total_tokens=440,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2294/500000]
+ train/ActionNoiseL2Loss=0.1351
+ throughput/total_tokens=440,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2295/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=440,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2296/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=440,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2297/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=441,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2298/500000]
+ train/ActionNoiseL2Loss=0.1367
+ throughput/total_tokens=441,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2299/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=441,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2300/500000]
+ optim/total_grad_norm=1.794
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=441,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2301/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=441,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2302/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=441,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2303/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=442,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2304/500000]
+ train/ActionNoiseL2Loss=0.1715
+ throughput/total_tokens=442,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2305/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=442,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2306/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=442,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2307/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=442,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2308/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=443,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2309/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=443,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2310/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=443,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=2311/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=443,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2312/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=443,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2313/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=444,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2314/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=444,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2315/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=444,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2316/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=444,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2317/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=444,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2318/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=445,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2319/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=445,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2320/500000]
+ optim/total_grad_norm=1.447
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=445,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2321/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=445,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2322/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=445,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2323/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=446,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2324/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=446,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2325/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=446,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2326/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=446,592,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2327/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=446,784,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2328/500000]
+ train/ActionNoiseL2Loss=0.1359
+ throughput/total_tokens=446,976,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2329/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=447,168,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2330/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=447,360,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2331/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=447,552,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2332/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=447,744,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2333/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=447,936,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2334/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=448,128,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2335/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=448,320,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2336/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=448,512,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2337/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=448,704,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2338/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=448,896,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2339/500000]
+ train/ActionNoiseL2Loss=0.1216
+ throughput/total_tokens=449,088,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2340/500000]
+ optim/total_grad_norm=2.786
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=449,280,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2341/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=449,472,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2342/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=449,664,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2343/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=449,856,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2344/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=450,048,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2345/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=450,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2346/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=450,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2347/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=450,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2348/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=450,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2349/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=451,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2350/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=451,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2351/500000]
+ train/ActionNoiseL2Loss=0.1549
+ throughput/total_tokens=451,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2352/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=451,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2353/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=451,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2354/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=451,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2355/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=452,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2356/500000]
+ train/ActionNoiseL2Loss=0.1298
+ throughput/total_tokens=452,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2357/500000]
+ train/ActionNoiseL2Loss=0.1019
+ throughput/total_tokens=452,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2358/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=452,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2359/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=452,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2360/500000]
+ optim/total_grad_norm=2.315
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=453,120,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=2361/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=453,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2362/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=453,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2363/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=453,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2364/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=453,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2365/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=454,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2366/500000]
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=454,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2367/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=454,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2368/500000]
+ train/ActionNoiseL2Loss=0.1365
+ throughput/total_tokens=454,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2369/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=454,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2370/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=455,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2371/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=455,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2372/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=455,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2373/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=455,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2374/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=455,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2375/500000]
+ train/ActionNoiseL2Loss=0.1484
+ throughput/total_tokens=456,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2376/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=456,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2377/500000]
+ train/ActionNoiseL2Loss=0.1765
+ throughput/total_tokens=456,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2378/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=456,576,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2379/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=456,768,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2380/500000]
+ optim/total_grad_norm=2.703
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=456,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2381/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=457,152,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2382/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=457,344,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2383/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=457,536,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2384/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=457,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2385/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=457,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2386/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=458,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2387/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=458,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2388/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=458,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2389/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=458,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2390/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=458,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2391/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=459,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2392/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=459,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2393/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=459,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2394/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=459,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2395/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=459,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2396/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=460,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2397/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=460,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2398/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=460,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2399/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=460,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2400/500000]
+ optim/total_grad_norm=2.522
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=460,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2401/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=460,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2402/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=461,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2403/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=461,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2404/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=461,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2405/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=461,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2406/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=461,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2407/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=462,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2408/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=462,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2409/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=462,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2410/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=462,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=2411/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=462,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2412/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=463,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2413/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=463,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2414/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=463,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2415/500000]
+ train/ActionNoiseL2Loss=0.1122
+ throughput/total_tokens=463,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2416/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=463,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2417/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=464,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2418/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=464,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2419/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=464,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2420/500000]
+ optim/total_grad_norm=3.221
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=464,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2421/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=464,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2422/500000]
+ train/ActionNoiseL2Loss=0.1567
+ throughput/total_tokens=465,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2423/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=465,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2424/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=465,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2425/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=465,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2426/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=465,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2427/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=465,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2428/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=466,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2429/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=466,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2430/500000]
+ train/ActionNoiseL2Loss=0.1784
+ throughput/total_tokens=466,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2431/500000]
+ train/ActionNoiseL2Loss=0.1172
+ throughput/total_tokens=466,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2432/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=466,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2433/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=467,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2434/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=467,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2435/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=467,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2436/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=467,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2437/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=467,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2438/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=468,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2439/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=468,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2440/500000]
+ optim/total_grad_norm=1.629
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=468,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2441/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=468,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2442/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=468,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2443/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=469,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2444/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=469,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2445/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=469,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2446/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=469,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2447/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=469,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2448/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=470,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2449/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=470,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2450/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=470,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2451/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=470,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2452/500000]
+ train/ActionNoiseL2Loss=0.1183
+ throughput/total_tokens=470,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2453/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=470,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2454/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=471,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2455/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=471,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2456/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=471,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2457/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=471,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2458/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=471,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2459/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=472,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2460/500000]
+ optim/total_grad_norm=1.585
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=472,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=2461/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=472,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2462/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=472,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2463/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=472,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2464/500000]
+ train/ActionNoiseL2Loss=0.1167
+ throughput/total_tokens=473,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2465/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=473,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2466/500000]
+ train/ActionNoiseL2Loss=0.1194
+ throughput/total_tokens=473,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2467/500000]
+ train/ActionNoiseL2Loss=0.1437
+ throughput/total_tokens=473,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2468/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=473,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2469/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=474,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2470/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=474,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2471/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=474,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2472/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=474,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2473/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=474,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2474/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=475,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2475/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=475,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2476/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=475,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2477/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=475,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2478/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=475,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2479/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=475,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2480/500000]
+ optim/total_grad_norm=1.748
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=476,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2481/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=476,352,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2482/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=476,544,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2483/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=476,736,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2484/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=476,928,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2485/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=477,120,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2486/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=477,312,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2487/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=477,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2488/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=477,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2489/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=477,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2490/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=478,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2491/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=478,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2492/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=478,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2493/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=478,656,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2494/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=478,848,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2495/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=479,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2496/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=479,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2497/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=479,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2498/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=479,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2499/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=479,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=2500/500000]
+ optim/total_grad_norm=3.811
+ train/ActionNoiseL2Loss=0.1222
+ throughput/total_tokens=480,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+10/03 [07:25:13] INFO | >> Saving config... checkpoint.py:608
+10/03 [07:25:49] INFO | >> Saving model state... checkpoint.py:796
+10/03 [07:27:01] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [07:28:25] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=2501/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=480,192,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=2502/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=480,384,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=2503/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=480,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=2504/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=480,768,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2505/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=480,960,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=2506/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=481,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=2507/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=481,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=2508/500000]
+ train/ActionNoiseL2Loss=0.1442
+ throughput/total_tokens=481,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2509/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=481,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2510/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=481,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2511/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=482,112,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2512/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=482,304,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2513/500000]
+ train/ActionNoiseL2Loss=0.1127
+ throughput/total_tokens=482,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2514/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=482,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2515/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=482,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2516/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=483,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2517/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=483,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2518/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=483,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2519/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=483,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2520/500000]
+ optim/total_grad_norm=1.924
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=483,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2521/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=484,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2522/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=484,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2523/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=484,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2524/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=484,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2525/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=484,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2526/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=484,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2527/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=485,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2528/500000]
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=485,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2529/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=485,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2530/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=485,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2531/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=485,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2532/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=486,144,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2533/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=486,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2534/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=486,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2535/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=486,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2536/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=486,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2537/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=487,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2538/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=487,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2539/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=487,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2540/500000]
+ optim/total_grad_norm=2.246
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=487,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2541/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=487,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2542/500000]
+ train/ActionNoiseL2Loss=0.1322
+ throughput/total_tokens=488,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2543/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=488,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2544/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=488,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2545/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=488,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2546/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=488,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2547/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=489,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2548/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=489,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2549/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=489,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2550/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=489,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2551/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=489,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2552/500000]
+ train/ActionNoiseL2Loss=0.1018
+ throughput/total_tokens=489,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2553/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=490,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2554/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=490,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2555/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=490,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2556/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=490,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2557/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=490,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2558/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=491,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2559/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=491,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2560/500000]
+ optim/total_grad_norm=2.070
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=491,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=2561/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=491,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2562/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=491,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2563/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=492,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2564/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=492,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2565/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=492,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2566/500000]
+ train/ActionNoiseL2Loss=0.1496
+ throughput/total_tokens=492,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2567/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=492,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2568/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=493,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2569/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=493,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2570/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=493,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2571/500000]
+ train/ActionNoiseL2Loss=0.1020
+ throughput/total_tokens=493,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2572/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=493,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2573/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=494,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2574/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=494,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2575/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=494,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2576/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=494,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2577/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=494,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2578/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=494,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2579/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=495,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2580/500000]
+ optim/total_grad_norm=2.107
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=495,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2581/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=495,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2582/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=495,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2583/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=495,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2584/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=496,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2585/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=496,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2586/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=496,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2587/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=496,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2588/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=496,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2589/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=497,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2590/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=497,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2591/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=497,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2592/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=497,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2593/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=497,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2594/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=498,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2595/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=498,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2596/500000]
+ train/ActionNoiseL2Loss=0.1109
+ throughput/total_tokens=498,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2597/500000]
+ train/ActionNoiseL2Loss=0.1518
+ throughput/total_tokens=498,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2598/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=498,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2599/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=499,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2600/500000]
+ optim/total_grad_norm=2.462
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=499,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2601/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=499,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2602/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=499,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2603/500000]
+ train/ActionNoiseL2Loss=0.1433
+ throughput/total_tokens=499,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2604/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=499,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2605/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=500,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2606/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=500,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2607/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=500,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2608/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=500,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2609/500000]
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=500,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2610/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=501,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=2611/500000]
+ train/ActionNoiseL2Loss=0.1288
+ throughput/total_tokens=501,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2612/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=501,504,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2613/500000]
+ train/ActionNoiseL2Loss=0.1285
+ throughput/total_tokens=501,696,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2614/500000]
+ train/ActionNoiseL2Loss=0.1355
+ throughput/total_tokens=501,888,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2615/500000]
+ train/ActionNoiseL2Loss=0.1026
+ throughput/total_tokens=502,080,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2616/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=502,272,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2617/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=502,464,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2618/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=502,656,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2619/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=502,848,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2620/500000]
+ optim/total_grad_norm=1.923
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=503,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2621/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=503,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2622/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=503,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2623/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=503,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2624/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=503,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2625/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=504,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2626/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=504,192,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2627/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=504,384,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2628/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=504,576,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2629/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=504,768,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2630/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=504,960,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2631/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=505,152,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2632/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=505,344,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2633/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=505,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2634/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=505,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2635/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=505,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2636/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=506,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2637/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=506,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2638/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=506,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2639/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=506,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2640/500000]
+ optim/total_grad_norm=1.692
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=506,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2641/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=507,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2642/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=507,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2643/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=507,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2644/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=507,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2645/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=507,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2646/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=508,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2647/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=508,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2648/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=508,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2649/500000]
+ train/ActionNoiseL2Loss=0.1397
+ throughput/total_tokens=508,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2650/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=508,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2651/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=508,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2652/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=509,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2653/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=509,376,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2654/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=509,568,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2655/500000]
+ train/ActionNoiseL2Loss=0.1296
+ throughput/total_tokens=509,760,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2656/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=509,952,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2657/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=510,144,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2658/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=510,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2659/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=510,528,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2660/500000]
+ optim/total_grad_norm=1.652
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=510,720,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=2661/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=510,912,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2662/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=511,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2663/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=511,296,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2664/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=511,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2665/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=511,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2666/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=511,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2667/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=512,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2668/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=512,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2669/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=512,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2670/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=512,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2671/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=512,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2672/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=513,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2673/500000]
+ train/ActionNoiseL2Loss=0.1154
+ throughput/total_tokens=513,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2674/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=513,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2675/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=513,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2676/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=513,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2677/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=513,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2678/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=514,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2679/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=514,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2680/500000]
+ optim/total_grad_norm=1.410
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=514,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2681/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=514,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2682/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=514,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2683/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=515,136,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2684/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=515,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2685/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=515,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2686/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=515,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2687/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=515,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2688/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=516,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2689/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=516,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2690/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=516,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2691/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=516,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2692/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=516,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2693/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=517,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2694/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=517,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2695/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=517,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2696/500000]
+ train/ActionNoiseL2Loss=0.1234
+ throughput/total_tokens=517,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2697/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=517,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2698/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=518,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2699/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=518,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2700/500000]
+ optim/total_grad_norm=1.969
+ train/ActionNoiseL2Loss=0.1066
+ throughput/total_tokens=518,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2701/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=518,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2702/500000]
+ train/ActionNoiseL2Loss=0.1159
+ throughput/total_tokens=518,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2703/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=518,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2704/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=519,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2705/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=519,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2706/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=519,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2707/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=519,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2708/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=519,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2709/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=520,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2710/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=520,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=2711/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=520,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2712/500000]
+ train/ActionNoiseL2Loss=0.1344
+ throughput/total_tokens=520,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2713/500000]
+ train/ActionNoiseL2Loss=0.1479
+ throughput/total_tokens=520,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2714/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=521,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2715/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=521,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2716/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=521,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2717/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=521,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2718/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=521,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2719/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=522,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2720/500000]
+ optim/total_grad_norm=2.870
+ train/ActionNoiseL2Loss=0.1236
+ throughput/total_tokens=522,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2721/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=522,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2722/500000]
+ train/ActionNoiseL2Loss=0.1234
+ throughput/total_tokens=522,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2723/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=522,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2724/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=523,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2725/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=523,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2726/500000]
+ train/ActionNoiseL2Loss=0.1118
+ throughput/total_tokens=523,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2727/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=523,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2728/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=523,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2729/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=523,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2730/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=524,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2731/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=524,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2732/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=524,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2733/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=524,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2734/500000]
+ train/ActionNoiseL2Loss=0.1052
+ throughput/total_tokens=524,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2735/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=525,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2736/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=525,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2737/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=525,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2738/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=525,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2739/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=525,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2740/500000]
+ optim/total_grad_norm=1.724
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=526,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2741/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=526,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2742/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=526,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2743/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=526,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2744/500000]
+ train/ActionNoiseL2Loss=0.1222
+ throughput/total_tokens=526,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2745/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=527,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2746/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=527,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2747/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=527,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2748/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=527,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2749/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=527,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2750/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=528,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2751/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=528,192,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2752/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=528,384,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2753/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=528,576,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2754/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=528,768,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2755/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=528,960,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2756/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=529,152,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2757/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=529,344,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2758/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=529,536,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2759/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=529,728,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2760/500000]
+ optim/total_grad_norm=2.576
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=529,920,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=2761/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=530,112,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2762/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=530,304,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2763/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=530,496,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2764/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=530,688,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2765/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=530,880,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2766/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=531,072,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2767/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=531,264,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2768/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=531,456,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2769/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=531,648,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2770/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=531,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2771/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=532,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2772/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=532,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2773/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=532,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2774/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=532,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2775/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=532,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2776/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=532,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2777/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=533,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2778/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=533,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2779/500000]
+ train/ActionNoiseL2Loss=0.1259
+ throughput/total_tokens=533,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2780/500000]
+ optim/total_grad_norm=1.847
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=533,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2781/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=533,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2782/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=534,144,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2783/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=534,336,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2784/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=534,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2785/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=534,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2786/500000]
+ train/ActionNoiseL2Loss=0.1146
+ throughput/total_tokens=534,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2787/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=535,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2788/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=535,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2789/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=535,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2790/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=535,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2791/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=535,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2792/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=536,064,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2793/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=536,256,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2794/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=536,448,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2795/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=536,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2796/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=536,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2797/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=537,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2798/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=537,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2799/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=537,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2800/500000]
+ optim/total_grad_norm=2.240
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=537,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2801/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=537,792,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2802/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=537,984,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2803/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=538,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2804/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=538,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2805/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=538,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2806/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=538,752,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2807/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=538,944,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2808/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=539,136,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2809/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=539,328,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2810/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=539,520,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=2811/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=539,712,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2812/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=539,904,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2813/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=540,096,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2814/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=540,288,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2815/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=540,480,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2816/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=540,672,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2817/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=540,864,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2818/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=541,056,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2819/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=541,248,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2820/500000]
+ optim/total_grad_norm=1.590
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=541,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2821/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=541,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2822/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=541,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2823/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=542,016,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2824/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=542,208,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2825/500000]
+ train/ActionNoiseL2Loss=0.1423
+ throughput/total_tokens=542,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2826/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=542,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2827/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=542,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2828/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=542,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2829/500000]
+ train/ActionNoiseL2Loss=0.1249
+ throughput/total_tokens=543,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2830/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=543,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2831/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=543,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2832/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=543,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2833/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=543,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2834/500000]
+ train/ActionNoiseL2Loss=0.1577
+ throughput/total_tokens=544,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2835/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=544,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2836/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=544,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2837/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=544,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2838/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=544,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2839/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=545,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2840/500000]
+ optim/total_grad_norm=2.134
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=545,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2841/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=545,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2842/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=545,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2843/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=545,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2844/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=546,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2845/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=546,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2846/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=546,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2847/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=546,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2848/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=546,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2849/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=547,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2850/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=547,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2851/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=547,392,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2852/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=547,584,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2853/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=547,776,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2854/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=547,968,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2855/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=548,160,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2856/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=548,352,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2857/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=548,544,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=2858/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=548,736,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2859/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=548,928,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2860/500000]
+ optim/total_grad_norm=1.650
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=549,120,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=2861/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=549,312,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2862/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=549,504,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=2863/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=549,696,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2864/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=549,888,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2865/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=550,080,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2866/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=550,272,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=2867/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=550,464,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=2868/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=550,656,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=2869/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=550,848,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=2870/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=551,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2871/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=551,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2872/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=551,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2873/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=551,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2874/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=551,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2875/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=552,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2876/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=552,192,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2877/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=552,384,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2878/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=552,576,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2879/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=552,768,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2880/500000]
+ optim/total_grad_norm=0.8881
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=552,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2881/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=553,152,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2882/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=553,344,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2883/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=553,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2884/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=553,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2885/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=553,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2886/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=554,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2887/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=554,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2888/500000]
+ train/ActionNoiseL2Loss=0.1543
+ throughput/total_tokens=554,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2889/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=554,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2890/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=554,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2891/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=555,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2892/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=555,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2893/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=555,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2894/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=555,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2895/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=555,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2896/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=556,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2897/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=556,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2898/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=556,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2899/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=556,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2900/500000]
+ optim/total_grad_norm=1.753
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=556,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2901/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=556,992,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2902/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=557,184,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2903/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=557,376,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2904/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=557,568,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2905/500000]
+ train/ActionNoiseL2Loss=0.1704
+ throughput/total_tokens=557,760,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2906/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=557,952,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2907/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=558,144,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2908/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=558,336,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2909/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=558,528,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2910/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=558,720,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=2911/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=558,912,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2912/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=559,104,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2913/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=559,296,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2914/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=559,488,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2915/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=559,680,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2916/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=559,872,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2917/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=560,064,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2918/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=560,256,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2919/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=560,448,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2920/500000]
+ optim/total_grad_norm=1.433
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=560,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2921/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=560,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2922/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=561,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2923/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=561,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2924/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=561,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2925/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=561,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2926/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=561,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2927/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=561,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2928/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=562,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2929/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=562,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2930/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=562,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2931/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=562,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2932/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=562,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2933/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=563,136,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2934/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=563,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2935/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=563,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2936/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=563,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2937/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=563,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2938/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=564,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2939/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=564,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2940/500000]
+ optim/total_grad_norm=1.673
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=564,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2941/500000]
+ train/ActionNoiseL2Loss=0.1232
+ throughput/total_tokens=564,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2942/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=564,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2943/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=565,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2944/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=565,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2945/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=565,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2946/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=565,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2947/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=565,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2948/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=566,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2949/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=566,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2950/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=566,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2951/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=566,592,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2952/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=566,784,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2953/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=566,976,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2954/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=567,168,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2955/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=567,360,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2956/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=567,552,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2957/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=567,744,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2958/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=567,936,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2959/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=568,128,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2960/500000]
+ optim/total_grad_norm=1.856
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=568,320,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=2961/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=568,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2962/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=568,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2963/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=568,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2964/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=569,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2965/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=569,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2966/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=569,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2967/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=569,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2968/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=569,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2969/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=570,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2970/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=570,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=2971/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=570,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2972/500000]
+ train/ActionNoiseL2Loss=0.1213
+ throughput/total_tokens=570,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2973/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=570,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2974/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=571,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2975/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=571,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2976/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=571,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2977/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=571,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2978/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=571,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2979/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=571,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2980/500000]
+ optim/total_grad_norm=2.325
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=572,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2981/500000]
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=572,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2982/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=572,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2983/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=572,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2984/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=572,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2985/500000]
+ train/ActionNoiseL2Loss=0.1368
+ throughput/total_tokens=573,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2986/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=573,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2987/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=573,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2988/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=573,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2989/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=573,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2990/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=574,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=2991/500000]
+ train/ActionNoiseL2Loss=0.1116
+ throughput/total_tokens=574,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=2992/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=574,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2993/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=574,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2994/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=574,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2995/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=575,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2996/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=575,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2997/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=575,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2998/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=575,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=2999/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=575,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3000/500000]
+ optim/total_grad_norm=1.902
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=576,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+10/03 [10:23:09] INFO | >> Saving config... checkpoint.py:608
+10/03 [10:23:44] INFO | >> Saving model state... checkpoint.py:796
+10/03 [10:24:56] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [10:26:19] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=3001/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=576,192,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=3002/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=576,384,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=3003/500000]
+ train/ActionNoiseL2Loss=0.1125
+ throughput/total_tokens=576,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3004/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=576,768,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3005/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=576,960,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3006/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=577,152,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3007/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=577,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3008/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=577,536,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3009/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=577,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3010/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=577,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3011/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=578,112,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3012/500000]
+ train/ActionNoiseL2Loss=0.1443
+ throughput/total_tokens=578,304,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3013/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=578,496,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3014/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=578,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3015/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=578,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3016/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=579,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3017/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=579,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3018/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=579,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3019/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=579,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3020/500000]
+ optim/total_grad_norm=1.305
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=579,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3021/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=580,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3022/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=580,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3023/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=580,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3024/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=580,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3025/500000]
+ train/ActionNoiseL2Loss=0.1422
+ throughput/total_tokens=580,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3026/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=580,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3027/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=581,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3028/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=581,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3029/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=581,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3030/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=581,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3031/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=581,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3032/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=582,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3033/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=582,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3034/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=582,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3035/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=582,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3036/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=582,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3037/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=583,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3038/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=583,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3039/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=583,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3040/500000]
+ optim/total_grad_norm=2.082
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=583,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3041/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=583,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3042/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=584,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3043/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=584,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3044/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=584,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3045/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=584,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3046/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=584,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3047/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=585,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3048/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=585,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3049/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=585,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3050/500000]
+ train/ActionNoiseL2Loss=0.1020
+ throughput/total_tokens=585,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3051/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=585,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3052/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=585,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3053/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=586,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3054/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=586,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3055/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=586,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3056/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=586,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3057/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=586,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3058/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=587,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3059/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=587,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3060/500000]
+ optim/total_grad_norm=1.784
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=587,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=3061/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=587,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3062/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=587,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3063/500000]
+ train/ActionNoiseL2Loss=0.1533
+ throughput/total_tokens=588,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3064/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=588,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3065/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=588,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3066/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=588,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3067/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=588,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3068/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=589,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3069/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=589,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3070/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=589,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3071/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=589,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3072/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=589,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3073/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=590,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3074/500000]
+ train/ActionNoiseL2Loss=0.1319
+ throughput/total_tokens=590,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3075/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=590,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3076/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=590,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3077/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=590,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3078/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=590,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3079/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=591,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3080/500000]
+ optim/total_grad_norm=2.153
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=591,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3081/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=591,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3082/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=591,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3083/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=591,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3084/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=592,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3085/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=592,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3086/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=592,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3087/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=592,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3088/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=592,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3089/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=593,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3090/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=593,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3091/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=593,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3092/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=593,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3093/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=593,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3094/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=594,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3095/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=594,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3096/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=594,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3097/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=594,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3098/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=594,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3099/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=595,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3100/500000]
+ optim/total_grad_norm=1.778
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=595,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3101/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=595,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3102/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=595,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3103/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=595,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3104/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=595,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3105/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=596,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3106/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=596,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3107/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=596,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3108/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=596,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3109/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=596,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3110/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=597,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=3111/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=597,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3112/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=597,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3113/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=597,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3114/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=597,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3115/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=598,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3116/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=598,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3117/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=598,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3118/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=598,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3119/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=598,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3120/500000]
+ optim/total_grad_norm=1.230
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=599,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3121/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=599,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3122/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=599,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3123/500000]
+ train/ActionNoiseL2Loss=0.1212
+ throughput/total_tokens=599,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3124/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=599,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3125/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=600,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3126/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=600,192,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3127/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=600,384,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3128/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=600,576,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3129/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=600,768,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3130/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=600,960,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3131/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=601,152,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3132/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=601,344,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3133/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=601,536,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3134/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=601,728,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3135/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=601,920,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3136/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=602,112,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3137/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=602,304,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3138/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=602,496,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3139/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=602,688,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3140/500000]
+ optim/total_grad_norm=2.483
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=602,880,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3141/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=603,072,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3142/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=603,264,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3143/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=603,456,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3144/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=603,648,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3145/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=603,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3146/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=604,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3147/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=604,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3148/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=604,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3149/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=604,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3150/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=604,800,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3151/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=604,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3152/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=605,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3153/500000]
+ train/ActionNoiseL2Loss=0.1303
+ throughput/total_tokens=605,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3154/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=605,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3155/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=605,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3156/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=605,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3157/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=606,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3158/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=606,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3159/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=606,528,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3160/500000]
+ optim/total_grad_norm=1.140
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=606,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=3161/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=606,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3162/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=607,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3163/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=607,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3164/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=607,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3165/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=607,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3166/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=607,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3167/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=608,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3168/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=608,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3169/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=608,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3170/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=608,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3171/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=608,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3172/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=609,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3173/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=609,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3174/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=609,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3175/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=609,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3176/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=609,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3177/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=609,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3178/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=610,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3179/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=610,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3180/500000]
+ optim/total_grad_norm=2.118
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=610,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3181/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=610,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3182/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=610,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3183/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=611,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3184/500000]
+ train/ActionNoiseL2Loss=0.1236
+ throughput/total_tokens=611,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3185/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=611,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3186/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=611,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3187/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=611,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3188/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=612,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3189/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=612,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3190/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=612,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3191/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=612,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3192/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=612,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3193/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=613,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3194/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=613,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3195/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=613,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3196/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=613,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3197/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=613,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3198/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=614,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3199/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=614,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3200/500000]
+ optim/total_grad_norm=1.234
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=614,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3201/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=614,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3202/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=614,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3203/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=614,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3204/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=615,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3205/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=615,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3206/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=615,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3207/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=615,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3208/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=615,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3209/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=616,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3210/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=616,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=3211/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=616,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3212/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=616,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3213/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=616,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3214/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=617,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3215/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=617,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3216/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=617,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3217/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=617,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3218/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=617,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3219/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=618,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3220/500000]
+ optim/total_grad_norm=1.230
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=618,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3221/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=618,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3222/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=618,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3223/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=618,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3224/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=619,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3225/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=619,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3226/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=619,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3227/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=619,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3228/500000]
+ train/ActionNoiseL2Loss=0.1084
+ throughput/total_tokens=619,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3229/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=619,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3230/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=620,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3231/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=620,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3232/500000]
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=620,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3233/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=620,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3234/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=620,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3235/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=621,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3236/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=621,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3237/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=621,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3238/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=621,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3239/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=621,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3240/500000]
+ optim/total_grad_norm=2.143
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=622,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3241/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=622,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3242/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=622,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3243/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=622,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3244/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=622,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3245/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=623,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3246/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=623,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3247/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=623,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3248/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=623,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3249/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=623,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3250/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=624,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3251/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=624,192,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3252/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=624,384,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3253/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=624,576,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3254/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=624,768,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3255/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=624,960,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3256/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=625,152,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3257/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=625,344,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3258/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=625,536,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3259/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=625,728,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3260/500000]
+ optim/total_grad_norm=1.546
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=625,920,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=3261/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=626,112,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3262/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=626,304,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3263/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=626,496,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3264/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=626,688,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3265/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=626,880,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3266/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=627,072,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3267/500000]
+ train/ActionNoiseL2Loss=0.1293
+ throughput/total_tokens=627,264,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3268/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=627,456,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3269/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=627,648,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3270/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=627,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3271/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=628,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3272/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=628,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3273/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=628,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3274/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=628,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3275/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=628,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3276/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=628,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3277/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=629,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3278/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=629,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3279/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=629,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3280/500000]
+ optim/total_grad_norm=2.407
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=629,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3281/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=629,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3282/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=630,144,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3283/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=630,336,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3284/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=630,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3285/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=630,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3286/500000]
+ train/ActionNoiseL2Loss=0.1562
+ throughput/total_tokens=630,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3287/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=631,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3288/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=631,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3289/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=631,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3290/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=631,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3291/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=631,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3292/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=632,064,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3293/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=632,256,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3294/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=632,448,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3295/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=632,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3296/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=632,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3297/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=633,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3298/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=633,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3299/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=633,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3300/500000]
+ optim/total_grad_norm=1.469
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=633,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3301/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=633,792,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3302/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=633,984,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3303/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=634,176,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3304/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=634,368,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3305/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=634,560,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3306/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=634,752,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3307/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=634,944,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3308/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=635,136,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3309/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=635,328,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3310/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=635,520,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=3311/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=635,712,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3312/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=635,904,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3313/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=636,096,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3314/500000]
+ train/ActionNoiseL2Loss=0.1290
+ throughput/total_tokens=636,288,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3315/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=636,480,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3316/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=636,672,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3317/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=636,864,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3318/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=637,056,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3319/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=637,248,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3320/500000]
+ optim/total_grad_norm=1.530
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=637,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3321/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=637,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3322/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=637,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3323/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=638,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3324/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=638,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3325/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=638,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3326/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=638,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3327/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=638,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3328/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=638,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3329/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=639,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3330/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=639,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3331/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=639,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3332/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=639,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3333/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=639,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3334/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=640,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3335/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=640,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3336/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=640,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3337/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=640,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3338/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=640,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3339/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=641,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3340/500000]
+ optim/total_grad_norm=1.533
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=641,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3341/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=641,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3342/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=641,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3343/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=641,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3344/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=642,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3345/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=642,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3346/500000]
+ train/ActionNoiseL2Loss=0.1205
+ throughput/total_tokens=642,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3347/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=642,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3348/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=642,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3349/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=643,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3350/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=643,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3351/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=643,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3352/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=643,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3353/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=643,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3354/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=643,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3355/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=644,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3356/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=644,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3357/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=644,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3358/500000]
+ train/ActionNoiseL2Loss=0.1506
+ throughput/total_tokens=644,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3359/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=644,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3360/500000]
+ optim/total_grad_norm=1.708
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=645,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=3361/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=645,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3362/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=645,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3363/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=645,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3364/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=645,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3365/500000]
+ train/ActionNoiseL2Loss=0.1707
+ throughput/total_tokens=646,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3366/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=646,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3367/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=646,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3368/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=646,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3369/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=646,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3370/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=647,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3371/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=647,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3372/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=647,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3373/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=647,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3374/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=647,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3375/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=648,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3376/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=648,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3377/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=648,384,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3378/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=648,576,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3379/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=648,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3380/500000]
+ optim/total_grad_norm=1.028
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=648,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3381/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=649,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3382/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=649,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3383/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=649,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3384/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=649,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3385/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=649,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3386/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=650,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3387/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=650,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3388/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=650,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3389/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=650,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3390/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=650,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3391/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=651,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3392/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=651,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3393/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=651,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3394/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=651,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3395/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=651,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3396/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=652,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3397/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=652,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3398/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=652,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3399/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=652,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3400/500000]
+ optim/total_grad_norm=1.815
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=652,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3401/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=652,992,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3402/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=653,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3403/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=653,376,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3404/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=653,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3405/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=653,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3406/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=653,952,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3407/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=654,144,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3408/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=654,336,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3409/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=654,528,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3410/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=654,720,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=3411/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=654,912,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3412/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=655,104,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3413/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=655,296,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3414/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=655,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3415/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=655,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3416/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=655,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3417/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=656,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3418/500000]
+ train/ActionNoiseL2Loss=0.1147
+ throughput/total_tokens=656,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3419/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=656,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3420/500000]
+ optim/total_grad_norm=1.695
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=656,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3421/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=656,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3422/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=657,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3423/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=657,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3424/500000]
+ train/ActionNoiseL2Loss=0.1428
+ throughput/total_tokens=657,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3425/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=657,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3426/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=657,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3427/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=657,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3428/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=658,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3429/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=658,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3430/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=658,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3431/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=658,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3432/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=658,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3433/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=659,136,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3434/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=659,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3435/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=659,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3436/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=659,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3437/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=659,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3438/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=660,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3439/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=660,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3440/500000]
+ optim/total_grad_norm=2.949
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=660,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3441/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=660,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3442/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=660,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3443/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=661,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3444/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=661,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3445/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=661,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3446/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=661,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3447/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=661,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3448/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=662,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3449/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=662,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3450/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=662,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3451/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=662,592,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3452/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=662,784,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3453/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=662,976,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=3454/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=663,168,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=3455/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=663,360,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3456/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=663,552,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3457/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=663,744,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3458/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=663,936,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3459/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=664,128,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3460/500000]
+ optim/total_grad_norm=2.065
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=664,320,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3461/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=664,512,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3462/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=664,704,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3463/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=664,896,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3464/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=665,088,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3465/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=665,280,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3466/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=665,472,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3467/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=665,664,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3468/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=665,856,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3469/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=666,048,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3470/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=666,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3471/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=666,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3472/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=666,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3473/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=666,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3474/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=667,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3475/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=667,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3476/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=667,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3477/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=667,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3478/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=667,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3479/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=667,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3480/500000]
+ optim/total_grad_norm=1.591
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=668,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3481/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=668,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3482/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=668,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3483/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=668,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3484/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=668,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3485/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=669,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3486/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=669,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3487/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=669,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3488/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=669,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3489/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=669,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3490/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=670,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3491/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=670,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3492/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=670,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3493/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=670,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3494/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=670,848,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3495/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=671,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3496/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=671,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3497/500000]
+ train/ActionNoiseL2Loss=0.1242
+ throughput/total_tokens=671,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3498/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=671,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3499/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=671,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3500/500000]
+ optim/total_grad_norm=1.576
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=672,000,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+10/03 [13:20:39] INFO | >> Saving config... checkpoint.py:608
+10/03 [13:21:21] INFO | >> Saving model state... checkpoint.py:796
+10/03 [13:22:32] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [13:24:02] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=3501/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=672,192,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0490
+[step=3502/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=672,384,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=3503/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=672,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3504/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=672,768,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3505/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=672,960,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=3506/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=673,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=3507/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=673,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3508/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=673,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3509/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=673,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3510/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=673,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3511/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=674,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3512/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=674,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3513/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=674,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3514/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=674,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3515/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=674,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3516/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=675,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3517/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=675,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3518/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=675,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3519/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=675,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3520/500000]
+ optim/total_grad_norm=2.632
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=675,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3521/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=676,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3522/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=676,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3523/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=676,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3524/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=676,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3525/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=676,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3526/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=676,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3527/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=677,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3528/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=677,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3529/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=677,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3530/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=677,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3531/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=677,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3532/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=678,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3533/500000]
+ train/ActionNoiseL2Loss=0.1381
+ throughput/total_tokens=678,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3534/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=678,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3535/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=678,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3536/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=678,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3537/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=679,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3538/500000]
+ train/ActionNoiseL2Loss=0.1674
+ throughput/total_tokens=679,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3539/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=679,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3540/500000]
+ optim/total_grad_norm=1.784
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=679,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3541/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=679,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3542/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=680,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3543/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=680,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3544/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=680,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3545/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=680,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3546/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=680,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3547/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=681,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3548/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=681,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3549/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=681,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3550/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=681,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3551/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=681,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3552/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=681,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3553/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=682,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3554/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=682,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3555/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=682,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3556/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=682,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3557/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=682,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3558/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=683,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3559/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=683,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3560/500000]
+ optim/total_grad_norm=1.641
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=683,520,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=3561/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=683,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3562/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=683,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3563/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=684,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3564/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=684,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3565/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=684,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3566/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=684,672,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3567/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=684,864,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3568/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=685,056,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3569/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=685,248,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3570/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=685,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3571/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=685,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3572/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=685,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3573/500000]
+ train/ActionNoiseL2Loss=0.0897
+ throughput/total_tokens=686,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3574/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=686,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3575/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=686,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3576/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=686,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3577/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=686,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3578/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=686,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3579/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=687,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3580/500000]
+ optim/total_grad_norm=0.9988
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=687,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3581/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=687,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3582/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=687,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3583/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=687,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3584/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=688,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3585/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=688,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3586/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=688,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3587/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=688,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3588/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=688,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3589/500000]
+ train/ActionNoiseL2Loss=0.1416
+ throughput/total_tokens=689,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3590/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=689,280,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3591/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=689,472,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3592/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=689,664,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3593/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=689,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3594/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=690,048,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3595/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=690,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3596/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=690,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3597/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=690,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3598/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=690,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3599/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=691,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3600/500000]
+ optim/total_grad_norm=1.154
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=691,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3601/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=691,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3602/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=691,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3603/500000]
+ train/ActionNoiseL2Loss=0.1208
+ throughput/total_tokens=691,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3604/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=691,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3605/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=692,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3606/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=692,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3607/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=692,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3608/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=692,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3609/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=692,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3610/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=693,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=3611/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=693,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3612/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=693,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3613/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=693,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3614/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=693,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3615/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=694,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3616/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=694,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3617/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=694,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3618/500000]
+ train/ActionNoiseL2Loss=0.1605
+ throughput/total_tokens=694,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3619/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=694,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3620/500000]
+ optim/total_grad_norm=2.179
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=695,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3621/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=695,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3622/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=695,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3623/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=695,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3624/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=695,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3625/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=696,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3626/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=696,192,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3627/500000]
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=696,384,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3628/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=696,576,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3629/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=696,768,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=3630/500000]
+ train/ActionNoiseL2Loss=0.1593
+ throughput/total_tokens=696,960,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3631/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=697,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3632/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=697,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3633/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=697,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3634/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=697,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3635/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=697,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3636/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=698,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3637/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=698,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3638/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=698,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3639/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=698,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3640/500000]
+ optim/total_grad_norm=1.762
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=698,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3641/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=699,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3642/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=699,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3643/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=699,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3644/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=699,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3645/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=699,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3646/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=700,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3647/500000]
+ train/ActionNoiseL2Loss=0.1795
+ throughput/total_tokens=700,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3648/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=700,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3649/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=700,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3650/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=700,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3651/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=700,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3652/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=701,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3653/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=701,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3654/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=701,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3655/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=701,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3656/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=701,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3657/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=702,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3658/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=702,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3659/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=702,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3660/500000]
+ optim/total_grad_norm=1.573
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=702,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=3661/500000]
+ train/ActionNoiseL2Loss=0.1037
+ throughput/total_tokens=702,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3662/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=703,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3663/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=703,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3664/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=703,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3665/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=703,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3666/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=703,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3667/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=704,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3668/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=704,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3669/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=704,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3670/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=704,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3671/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=704,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3672/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=705,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3673/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=705,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3674/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=705,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3675/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=705,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3676/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=705,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3677/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=705,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3678/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=706,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3679/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=706,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3680/500000]
+ optim/total_grad_norm=1.604
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=706,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3681/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=706,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3682/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=706,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3683/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=707,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3684/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=707,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3685/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=707,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3686/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=707,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3687/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=707,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3688/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=708,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3689/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=708,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3690/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=708,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3691/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=708,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3692/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=708,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3693/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=709,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3694/500000]
+ train/ActionNoiseL2Loss=0.1213
+ throughput/total_tokens=709,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3695/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=709,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3696/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=709,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3697/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=709,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3698/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=710,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3699/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=710,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3700/500000]
+ optim/total_grad_norm=1.556
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=710,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3701/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=710,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3702/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=710,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3703/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=710,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3704/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=711,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3705/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=711,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3706/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=711,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3707/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=711,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3708/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=711,936,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3709/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=712,128,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3710/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=712,320,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=3711/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=712,512,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3712/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=712,704,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3713/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=712,896,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3714/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=713,088,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3715/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=713,280,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3716/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=713,472,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3717/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=713,664,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3718/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=713,856,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3719/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=714,048,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3720/500000]
+ optim/total_grad_norm=2.306
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=714,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3721/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=714,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3722/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=714,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3723/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=714,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3724/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=715,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3725/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=715,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3726/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=715,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3727/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=715,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3728/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=715,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3729/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=715,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3730/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=716,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3731/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=716,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3732/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=716,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3733/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=716,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3734/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=716,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3735/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=717,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3736/500000]
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=717,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3737/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=717,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3738/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=717,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3739/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=717,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3740/500000]
+ optim/total_grad_norm=2.060
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=718,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3741/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=718,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3742/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=718,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3743/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=718,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3744/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=718,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3745/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=719,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3746/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=719,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3747/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=719,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3748/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=719,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3749/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=719,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3750/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=720,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3751/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=720,192,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3752/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=720,384,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3753/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=720,576,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3754/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=720,768,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3755/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=720,960,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3756/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=721,152,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3757/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=721,344,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3758/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=721,536,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3759/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=721,728,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3760/500000]
+ optim/total_grad_norm=1.176
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=721,920,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=3761/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=722,112,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3762/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=722,304,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3763/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=722,496,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3764/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=722,688,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3765/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=722,880,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3766/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=723,072,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3767/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=723,264,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3768/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=723,456,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3769/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=723,648,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3770/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=723,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3771/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=724,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3772/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=724,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3773/500000]
+ train/ActionNoiseL2Loss=0.1037
+ throughput/total_tokens=724,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3774/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=724,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3775/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=724,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3776/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=724,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3777/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=725,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3778/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=725,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3779/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=725,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3780/500000]
+ optim/total_grad_norm=1.396
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=725,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3781/500000]
+ train/ActionNoiseL2Loss=0.1171
+ throughput/total_tokens=725,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3782/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=726,144,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3783/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=726,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3784/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=726,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3785/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=726,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3786/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=726,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3787/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=727,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3788/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=727,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3789/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=727,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3790/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=727,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3791/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=727,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3792/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=728,064,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3793/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=728,256,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3794/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=728,448,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3795/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=728,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3796/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=728,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3797/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=729,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3798/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=729,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3799/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=729,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3800/500000]
+ optim/total_grad_norm=2.023
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=729,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3801/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=729,792,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3802/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=729,984,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3803/500000]
+ train/ActionNoiseL2Loss=0.0976
+ throughput/total_tokens=730,176,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3804/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=730,368,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3805/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=730,560,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3806/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=730,752,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3807/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=730,944,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3808/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=731,136,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3809/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=731,328,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3810/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=731,520,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=3811/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=731,712,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3812/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=731,904,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3813/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=732,096,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3814/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=732,288,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3815/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=732,480,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3816/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=732,672,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3817/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=732,864,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3818/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=733,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3819/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=733,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3820/500000]
+ optim/total_grad_norm=1.400
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=733,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3821/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=733,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3822/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=733,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3823/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=734,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3824/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=734,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3825/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=734,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3826/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=734,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3827/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=734,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3828/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=734,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3829/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=735,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3830/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=735,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3831/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=735,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3832/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=735,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3833/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=735,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3834/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=736,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3835/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=736,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3836/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=736,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3837/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=736,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3838/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=736,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3839/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=737,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3840/500000]
+ optim/total_grad_norm=0.8565
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=737,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3841/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=737,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3842/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=737,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3843/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=737,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3844/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=738,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3845/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=738,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3846/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=738,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3847/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=738,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3848/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=738,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3849/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=739,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3850/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=739,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3851/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=739,392,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=3852/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=739,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3853/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=739,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3854/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=739,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3855/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=740,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3856/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=740,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3857/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=740,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3858/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=740,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3859/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=740,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3860/500000]
+ optim/total_grad_norm=1.725
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=741,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=3861/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=741,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3862/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=741,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3863/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=741,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3864/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=741,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3865/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=742,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3866/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=742,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3867/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=742,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3868/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=742,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3869/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=742,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3870/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=743,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3871/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=743,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3872/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=743,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3873/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=743,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3874/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=743,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3875/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=744,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3876/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=744,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3877/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=744,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3878/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=744,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3879/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=744,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3880/500000]
+ optim/total_grad_norm=1.898
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=744,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3881/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=745,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3882/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=745,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3883/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=745,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3884/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=745,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3885/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=745,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3886/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=746,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3887/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=746,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3888/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=746,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3889/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=746,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3890/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=746,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3891/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=747,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3892/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=747,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3893/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=747,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3894/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=747,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3895/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=747,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3896/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=748,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3897/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=748,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3898/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=748,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3899/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=748,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3900/500000]
+ optim/total_grad_norm=1.368
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=748,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3901/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=748,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3902/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=749,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3903/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=749,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3904/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=749,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3905/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=749,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3906/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=749,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3907/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=750,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3908/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=750,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3909/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=750,528,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3910/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=750,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=3911/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=750,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3912/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=751,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3913/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=751,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3914/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=751,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3915/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=751,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3916/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=751,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3917/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=752,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3918/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=752,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3919/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=752,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3920/500000]
+ optim/total_grad_norm=1.541
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=752,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3921/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=752,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3922/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=753,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3923/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=753,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3924/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=753,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3925/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=753,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3926/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=753,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3927/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=753,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3928/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=754,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3929/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=754,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3930/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=754,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3931/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=754,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3932/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=754,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3933/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=755,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3934/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=755,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3935/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=755,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3936/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=755,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3937/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=755,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3938/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=756,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3939/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=756,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3940/500000]
+ optim/total_grad_norm=2.266
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=756,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3941/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=756,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3942/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=756,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3943/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=757,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3944/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=757,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3945/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=757,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3946/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=757,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3947/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=757,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3948/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=758,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3949/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=758,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3950/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=758,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3951/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=758,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3952/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=758,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3953/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=758,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3954/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=759,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3955/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=759,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3956/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=759,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3957/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=759,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3958/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=759,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3959/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=760,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3960/500000]
+ optim/total_grad_norm=2.094
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=760,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=3961/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=760,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3962/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=760,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3963/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=760,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3964/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=761,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3965/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=761,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3966/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=761,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3967/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=761,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3968/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=761,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3969/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=762,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3970/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=762,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3971/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=762,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3972/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=762,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3973/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=762,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3974/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=763,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3975/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=763,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3976/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=763,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3977/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=763,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3978/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=763,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3979/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=763,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3980/500000]
+ optim/total_grad_norm=1.674
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=764,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=3981/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=764,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3982/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=764,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3983/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=764,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=3984/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=764,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3985/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=765,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3986/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=765,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3987/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=765,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3988/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=765,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3989/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=765,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3990/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=766,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=3991/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=766,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3992/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=766,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3993/500000]
+ train/ActionNoiseL2Loss=0.1054
+ throughput/total_tokens=766,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3994/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=766,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3995/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=767,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3996/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=767,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3997/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=767,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3998/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=767,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=3999/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=767,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4000/500000]
+ optim/total_grad_norm=1.980
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=768,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+10/03 [16:18:49] INFO | >> Saving config... checkpoint.py:608
+10/03 [16:19:21] INFO | >> Saving model state... checkpoint.py:796
+10/03 [16:20:34] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [16:21:58] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=4001/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=768,192,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=4002/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=768,384,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=4003/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=768,576,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=4004/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=768,768,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4005/500000]
+ train/ActionNoiseL2Loss=0.1041
+ throughput/total_tokens=768,960,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4006/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=769,152,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4007/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=769,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4008/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=769,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4009/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=769,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4010/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=769,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4011/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=770,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4012/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=770,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4013/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=770,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4014/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=770,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4015/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=770,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4016/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=771,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4017/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=771,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4018/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=771,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4019/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=771,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4020/500000]
+ optim/total_grad_norm=1.043
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=771,840,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4021/500000]
+ train/ActionNoiseL2Loss=0.1407
+ throughput/total_tokens=772,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4022/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=772,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4023/500000]
+ train/ActionNoiseL2Loss=0.1482
+ throughput/total_tokens=772,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4024/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=772,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4025/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=772,800,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4026/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=772,992,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4027/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=773,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4028/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=773,376,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4029/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=773,568,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4030/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=773,760,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4031/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=773,952,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4032/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=774,144,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4033/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=774,336,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4034/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=774,528,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4035/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=774,720,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4036/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=774,912,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4037/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=775,104,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4038/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=775,296,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4039/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=775,488,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4040/500000]
+ optim/total_grad_norm=1.836
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=775,680,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4041/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=775,872,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4042/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=776,064,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4043/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=776,256,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4044/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=776,448,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4045/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=776,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4046/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=776,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4047/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=777,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4048/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=777,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4049/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=777,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4050/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=777,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4051/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=777,792,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4052/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=777,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4053/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=778,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4054/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=778,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4055/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=778,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4056/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=778,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4057/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=778,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4058/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=779,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4059/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=779,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4060/500000]
+ optim/total_grad_norm=1.907
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=779,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=4061/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=779,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4062/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=779,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4063/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=780,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4064/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=780,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4065/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=780,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4066/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=780,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4067/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=780,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4068/500000]
+ train/ActionNoiseL2Loss=0.1190
+ throughput/total_tokens=781,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4069/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=781,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4070/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=781,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4071/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=781,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4072/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=781,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4073/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=782,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4074/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=782,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4075/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=782,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4076/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=782,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4077/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=782,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4078/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=782,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4079/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=783,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4080/500000]
+ optim/total_grad_norm=1.933
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=783,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4081/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=783,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4082/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=783,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4083/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=783,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4084/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=784,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4085/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=784,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4086/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=784,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4087/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=784,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4088/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=784,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4089/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=785,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4090/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=785,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4091/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=785,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4092/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=785,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4093/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=785,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4094/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=786,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4095/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=786,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4096/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=786,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4097/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=786,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4098/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=786,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4099/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=787,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4100/500000]
+ optim/total_grad_norm=1.856
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=787,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4101/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=787,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4102/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=787,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4103/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=787,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4104/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=787,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4105/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=788,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4106/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=788,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4107/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=788,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4108/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=788,736,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=4109/500000]
+ train/ActionNoiseL2Loss=0.1116
+ throughput/total_tokens=788,928,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=4110/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=789,120,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=4111/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=789,312,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=4112/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=789,504,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=4113/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=789,696,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=4114/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=789,888,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=4115/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=790,080,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=4116/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=790,272,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=4117/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=790,464,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=4118/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=790,656,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=4119/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=790,848,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=4120/500000]
+ optim/total_grad_norm=3.187
+ train/ActionNoiseL2Loss=0.1521
+ throughput/total_tokens=791,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4121/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=791,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4122/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=791,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4123/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=791,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4124/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=791,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4125/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=792,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4126/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=792,192,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4127/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=792,384,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4128/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=792,576,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4129/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=792,768,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4130/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=792,960,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4131/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=793,152,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4132/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=793,344,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4133/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=793,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4134/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=793,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4135/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=793,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4136/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=794,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4137/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=794,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4138/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=794,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4139/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=794,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4140/500000]
+ optim/total_grad_norm=1.488
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=794,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4141/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=795,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4142/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=795,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4143/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=795,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4144/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=795,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4145/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=795,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4146/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=796,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4147/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=796,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4148/500000]
+ train/ActionNoiseL2Loss=0.1198
+ throughput/total_tokens=796,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4149/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=796,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4150/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=796,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4151/500000]
+ train/ActionNoiseL2Loss=0.1208
+ throughput/total_tokens=796,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4152/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=797,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4153/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=797,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4154/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=797,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4155/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=797,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4156/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=797,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4157/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=798,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4158/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=798,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4159/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=798,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4160/500000]
+ optim/total_grad_norm=1.572
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=798,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=4161/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=798,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4162/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=799,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4163/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=799,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4164/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=799,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4165/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=799,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4166/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=799,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4167/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=800,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4168/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=800,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4169/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=800,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4170/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=800,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4171/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=800,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4172/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=801,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4173/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=801,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4174/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=801,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4175/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=801,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4176/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=801,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4177/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=801,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4178/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=802,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4179/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=802,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4180/500000]
+ optim/total_grad_norm=1.280
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=802,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4181/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=802,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4182/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=802,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4183/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=803,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4184/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=803,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4185/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=803,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4186/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=803,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4187/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=803,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4188/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=804,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4189/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=804,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4190/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=804,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4191/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=804,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4192/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=804,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4193/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=805,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4194/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=805,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4195/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=805,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4196/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=805,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4197/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=805,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4198/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=806,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4199/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=806,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4200/500000]
+ optim/total_grad_norm=1.598
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=806,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4201/500000]
+ train/ActionNoiseL2Loss=0.1160
+ throughput/total_tokens=806,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4202/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=806,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4203/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=806,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4204/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=807,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4205/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=807,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4206/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=807,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4207/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=807,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4208/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=807,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4209/500000]
+ train/ActionNoiseL2Loss=0.1244
+ throughput/total_tokens=808,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4210/500000]
+ train/ActionNoiseL2Loss=0.1026
+ throughput/total_tokens=808,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=4211/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=808,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4212/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=808,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4213/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=808,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4214/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=809,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4215/500000]
+ train/ActionNoiseL2Loss=0.1062
+ throughput/total_tokens=809,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4216/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=809,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4217/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=809,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4218/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=809,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4219/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=810,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4220/500000]
+ optim/total_grad_norm=1.248
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=810,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4221/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=810,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4222/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=810,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4223/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=810,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4224/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=811,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4225/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=811,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4226/500000]
+ train/ActionNoiseL2Loss=0.1019
+ throughput/total_tokens=811,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4227/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=811,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4228/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=811,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4229/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=811,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4230/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=812,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4231/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=812,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4232/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=812,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4233/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=812,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4234/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=812,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4235/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=813,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4236/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=813,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4237/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=813,504,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4238/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=813,696,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4239/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=813,888,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4240/500000]
+ optim/total_grad_norm=1.823
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=814,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4241/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=814,272,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4242/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=814,464,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4243/500000]
+ train/ActionNoiseL2Loss=0.1410
+ throughput/total_tokens=814,656,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4244/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=814,848,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4245/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=815,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4246/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=815,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4247/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=815,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4248/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=815,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4249/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=815,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4250/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=816,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4251/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=816,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4252/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=816,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4253/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=816,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4254/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=816,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4255/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=816,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4256/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=817,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4257/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=817,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4258/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=817,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4259/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=817,728,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4260/500000]
+ optim/total_grad_norm=1.614
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=817,920,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=4261/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=818,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4262/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=818,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4263/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=818,496,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4264/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=818,688,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4265/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=818,880,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4266/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=819,072,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4267/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=819,264,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4268/500000]
+ train/ActionNoiseL2Loss=0.1274
+ throughput/total_tokens=819,456,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4269/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=819,648,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4270/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=819,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4271/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=820,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4272/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=820,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4273/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=820,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4274/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=820,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4275/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=820,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4276/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=820,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4277/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=821,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4278/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=821,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4279/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=821,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4280/500000]
+ optim/total_grad_norm=2.050
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=821,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4281/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=821,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4282/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=822,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4283/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=822,336,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4284/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=822,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4285/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=822,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4286/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=822,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4287/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=823,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4288/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=823,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4289/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=823,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4290/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=823,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4291/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=823,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4292/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=824,064,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4293/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=824,256,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4294/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=824,448,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4295/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=824,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4296/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=824,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4297/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=825,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4298/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=825,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4299/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=825,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4300/500000]
+ optim/total_grad_norm=1.888
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=825,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4301/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=825,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4302/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=825,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4303/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=826,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4304/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=826,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4305/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=826,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4306/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=826,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4307/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=826,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4308/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=827,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4309/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=827,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4310/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=827,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=4311/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=827,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4312/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=827,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4313/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=828,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4314/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=828,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4315/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=828,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4316/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=828,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4317/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=828,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4318/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=829,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4319/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=829,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4320/500000]
+ optim/total_grad_norm=2.269
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=829,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4321/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=829,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4322/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=829,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4323/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=830,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4324/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=830,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4325/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=830,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4326/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=830,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4327/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=830,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4328/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=830,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4329/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=831,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4330/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=831,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4331/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=831,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4332/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=831,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4333/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=831,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4334/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=832,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4335/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=832,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4336/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=832,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4337/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=832,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4338/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=832,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4339/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=833,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4340/500000]
+ optim/total_grad_norm=2.213
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=833,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4341/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=833,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4342/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=833,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4343/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=833,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4344/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=834,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4345/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=834,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4346/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=834,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4347/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=834,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4348/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=834,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4349/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=835,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4350/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=835,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4351/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=835,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4352/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=835,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4353/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=835,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4354/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=835,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4355/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=836,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4356/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=836,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4357/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=836,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4358/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=836,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4359/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=836,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4360/500000]
+ optim/total_grad_norm=1.133
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=837,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=4361/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=837,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4362/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=837,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4363/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=837,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4364/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=837,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4365/500000]
+ train/ActionNoiseL2Loss=0.1421
+ throughput/total_tokens=838,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4366/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=838,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4367/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=838,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4368/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=838,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4369/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=838,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4370/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=839,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4371/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=839,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4372/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=839,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4373/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=839,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4374/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=839,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4375/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=840,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4376/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=840,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4377/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=840,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4378/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=840,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4379/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=840,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4380/500000]
+ optim/total_grad_norm=1.802
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=840,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4381/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=841,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4382/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=841,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4383/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=841,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4384/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=841,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4385/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=841,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4386/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=842,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4387/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=842,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4388/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=842,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4389/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=842,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4390/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=842,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4391/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=843,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4392/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=843,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4393/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=843,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4394/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=843,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4395/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=843,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4396/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=844,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4397/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=844,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4398/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=844,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4399/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=844,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4400/500000]
+ optim/total_grad_norm=2.337
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=844,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4401/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=844,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4402/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=845,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4403/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=845,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4404/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=845,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4405/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=845,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4406/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=845,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4407/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=846,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4408/500000]
+ train/ActionNoiseL2Loss=0.1113
+ throughput/total_tokens=846,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4409/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=846,528,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4410/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=846,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=4411/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=846,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4412/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=847,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4413/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=847,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4414/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=847,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4415/500000]
+ train/ActionNoiseL2Loss=0.1196
+ throughput/total_tokens=847,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4416/500000]
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=847,872,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=4417/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=848,064,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=4418/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=848,256,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=4419/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=848,448,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=4420/500000]
+ optim/total_grad_norm=1.488
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=848,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4421/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=848,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4422/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=849,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4423/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=849,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4424/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=849,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4425/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=849,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4426/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=849,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4427/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=849,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4428/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=850,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4429/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=850,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4430/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=850,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4431/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=850,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4432/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=850,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4433/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=851,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4434/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=851,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4435/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=851,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4436/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=851,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4437/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=851,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4438/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=852,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4439/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=852,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4440/500000]
+ optim/total_grad_norm=1.552
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=852,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4441/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=852,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4442/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=852,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4443/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=853,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4444/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=853,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4445/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=853,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4446/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=853,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4447/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=853,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4448/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=854,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4449/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=854,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4450/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=854,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4451/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=854,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4452/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=854,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4453/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=854,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4454/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=855,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4455/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=855,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4456/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=855,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4457/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=855,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4458/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=855,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4459/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=856,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4460/500000]
+ optim/total_grad_norm=1.318
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=856,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=4461/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=856,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4462/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=856,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4463/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=856,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4464/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=857,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4465/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=857,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4466/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=857,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4467/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=857,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4468/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=857,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4469/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=858,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4470/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=858,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4471/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=858,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4472/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=858,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4473/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=858,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4474/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=859,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4475/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=859,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4476/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=859,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4477/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=859,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4478/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=859,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4479/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=859,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4480/500000]
+ optim/total_grad_norm=1.389
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=860,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4481/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=860,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4482/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=860,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4483/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=860,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4484/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=860,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4485/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=861,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4486/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=861,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4487/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=861,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4488/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=861,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4489/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=861,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4490/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=862,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4491/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=862,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4492/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=862,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4493/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=862,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4494/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=862,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4495/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=863,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4496/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=863,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4497/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=863,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4498/500000]
+ train/ActionNoiseL2Loss=0.1322
+ throughput/total_tokens=863,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4499/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=863,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4500/500000]
+ optim/total_grad_norm=1.212
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=864,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+10/03 [19:16:27] INFO | >> Saving config... checkpoint.py:608
+10/03 [19:17:08] INFO | >> Saving model state... checkpoint.py:796
+10/03 [19:18:21] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [19:19:52] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=4501/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=864,192,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=4502/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=864,384,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=4503/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=864,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=4504/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=864,768,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=4505/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=864,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4506/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=865,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=4507/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=865,344,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4508/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=865,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4509/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=865,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4510/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=865,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4511/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=866,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4512/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=866,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4513/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=866,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4514/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=866,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4515/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=866,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4516/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=867,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4517/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=867,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4518/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=867,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4519/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=867,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4520/500000]
+ optim/total_grad_norm=1.246
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=867,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4521/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=868,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4522/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=868,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4523/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=868,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4524/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=868,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4525/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=868,800,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4526/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=868,992,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4527/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=869,184,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4528/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=869,376,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4529/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=869,568,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4530/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=869,760,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4531/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=869,952,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4532/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=870,144,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4533/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=870,336,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4534/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=870,528,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4535/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=870,720,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4536/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=870,912,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4537/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=871,104,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4538/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=871,296,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4539/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=871,488,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4540/500000]
+ optim/total_grad_norm=1.055
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=871,680,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4541/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=871,872,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4542/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=872,064,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4543/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=872,256,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4544/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=872,448,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4545/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=872,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4546/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=872,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4547/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=873,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4548/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=873,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4549/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=873,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4550/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=873,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4551/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=873,792,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4552/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=873,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4553/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=874,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4554/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=874,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4555/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=874,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4556/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=874,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4557/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=874,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4558/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=875,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4559/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=875,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4560/500000]
+ optim/total_grad_norm=1.291
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=875,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=4561/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=875,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4562/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=875,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4563/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=876,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4564/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=876,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4565/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=876,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4566/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=876,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4567/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=876,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4568/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=877,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4569/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=877,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4570/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=877,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4571/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=877,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4572/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=877,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4573/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=878,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4574/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=878,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4575/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=878,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4576/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=878,592,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4577/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=878,784,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4578/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=878,976,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4579/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=879,168,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4580/500000]
+ optim/total_grad_norm=1.267
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=879,360,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4581/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=879,552,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4582/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=879,744,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4583/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=879,936,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=4584/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=880,128,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=4585/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=880,320,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4586/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=880,512,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4587/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=880,704,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4588/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=880,896,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4589/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=881,088,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4590/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=881,280,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4591/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=881,472,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4592/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=881,664,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4593/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=881,856,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4594/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=882,048,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4595/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=882,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4596/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=882,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4597/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=882,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4598/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=882,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4599/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=883,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4600/500000]
+ optim/total_grad_norm=0.9343
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=883,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4601/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=883,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4602/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=883,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4603/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=883,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4604/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=883,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4605/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=884,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4606/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=884,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4607/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=884,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4608/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=884,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4609/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=884,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4610/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=885,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=4611/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=885,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4612/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=885,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4613/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=885,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4614/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=885,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4615/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=886,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4616/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=886,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4617/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=886,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4618/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=886,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4619/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=886,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4620/500000]
+ optim/total_grad_norm=1.313
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=887,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4621/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=887,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4622/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=887,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4623/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=887,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4624/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=887,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4625/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=888,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4626/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=888,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4627/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=888,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4628/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=888,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4629/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=888,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4630/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=888,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4631/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=889,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4632/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=889,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4633/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=889,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4634/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=889,728,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4635/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=889,920,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4636/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=890,112,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4637/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=890,304,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4638/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=890,496,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4639/500000]
+ train/ActionNoiseL2Loss=0.1341
+ throughput/total_tokens=890,688,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4640/500000]
+ optim/total_grad_norm=1.491
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=890,880,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4641/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=891,072,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4642/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=891,264,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4643/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=891,456,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4644/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=891,648,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4645/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=891,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4646/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=892,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4647/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=892,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4648/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=892,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4649/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=892,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4650/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=892,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4651/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=892,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4652/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=893,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4653/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=893,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4654/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=893,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4655/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=893,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4656/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=893,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4657/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=894,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4658/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=894,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4659/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=894,528,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4660/500000]
+ optim/total_grad_norm=1.545
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=894,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=4661/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=894,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4662/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=895,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4663/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=895,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4664/500000]
+ train/ActionNoiseL2Loss=0.1449
+ throughput/total_tokens=895,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4665/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=895,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4666/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=895,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4667/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=896,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4668/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=896,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4669/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=896,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4670/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=896,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4671/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=896,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4672/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=897,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4673/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=897,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4674/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=897,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4675/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=897,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4676/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=897,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4677/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=897,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4678/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=898,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4679/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=898,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4680/500000]
+ optim/total_grad_norm=1.727
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=898,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4681/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=898,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4682/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=898,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4683/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=899,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4684/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=899,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4685/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=899,520,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4686/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=899,712,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4687/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=899,904,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4688/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=900,096,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4689/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=900,288,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4690/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=900,480,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4691/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=900,672,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4692/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=900,864,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4693/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=901,056,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4694/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=901,248,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4695/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=901,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4696/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=901,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4697/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=901,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4698/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=902,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4699/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=902,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4700/500000]
+ optim/total_grad_norm=1.008
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=902,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4701/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=902,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4702/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=902,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4703/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=902,976,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4704/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=903,168,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4705/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=903,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4706/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=903,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4707/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=903,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4708/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=903,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4709/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=904,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4710/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=904,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=4711/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=904,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4712/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=904,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4713/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=904,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4714/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=905,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4715/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=905,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4716/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=905,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4717/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=905,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4718/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=905,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4719/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=906,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4720/500000]
+ optim/total_grad_norm=1.840
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=906,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4721/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=906,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4722/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=906,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4723/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=906,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4724/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=907,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4725/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=907,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4726/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=907,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4727/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=907,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4728/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=907,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4729/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=907,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4730/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=908,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4731/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=908,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4732/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=908,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4733/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=908,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4734/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=908,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4735/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=909,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4736/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=909,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4737/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=909,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4738/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=909,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4739/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=909,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4740/500000]
+ optim/total_grad_norm=1.690
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=910,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4741/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=910,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4742/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=910,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4743/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=910,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4744/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=910,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4745/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=911,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4746/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=911,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4747/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=911,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4748/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=911,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4749/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=911,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4750/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=912,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4751/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=912,192,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4752/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=912,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4753/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=912,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4754/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=912,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4755/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=912,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4756/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=913,152,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4757/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=913,344,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4758/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=913,536,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4759/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=913,728,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4760/500000]
+ optim/total_grad_norm=2.168
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=913,920,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=4761/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=914,112,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4762/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=914,304,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4763/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=914,496,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4764/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=914,688,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4765/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=914,880,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4766/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=915,072,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4767/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=915,264,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4768/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=915,456,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4769/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=915,648,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4770/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=915,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=4771/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=916,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4772/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=916,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4773/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=916,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4774/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=916,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4775/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=916,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=4776/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=916,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4777/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=917,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4778/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=917,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4779/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=917,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4780/500000]
+ optim/total_grad_norm=1.434
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=917,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4781/500000]
+ train/ActionNoiseL2Loss=0.1252
+ throughput/total_tokens=917,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4782/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=918,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4783/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=918,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4784/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=918,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4785/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=918,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4786/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=918,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4787/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=919,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4788/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=919,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4789/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=919,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4790/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=919,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4791/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=919,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4792/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=920,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4793/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=920,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4794/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=920,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4795/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=920,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4796/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=920,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4797/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=921,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4798/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=921,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4799/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=921,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4800/500000]
+ optim/total_grad_norm=2.080
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=921,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4801/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=921,792,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4802/500000]
+ train/ActionNoiseL2Loss=0.1196
+ throughput/total_tokens=921,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4803/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=922,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4804/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=922,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4805/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=922,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4806/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=922,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4807/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=922,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4808/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=923,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4809/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=923,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4810/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=923,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=4811/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=923,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4812/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=923,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4813/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=924,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4814/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=924,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4815/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=924,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4816/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=924,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4817/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=924,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4818/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=925,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4819/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=925,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4820/500000]
+ optim/total_grad_norm=1.489
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=925,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4821/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=925,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4822/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=925,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4823/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=926,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4824/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=926,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4825/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=926,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4826/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=926,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4827/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=926,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4828/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=926,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4829/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=927,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4830/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=927,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4831/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=927,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4832/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=927,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4833/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=927,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4834/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=928,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4835/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=928,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4836/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=928,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4837/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=928,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4838/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=928,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4839/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=929,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4840/500000]
+ optim/total_grad_norm=1.104
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=929,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4841/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=929,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4842/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=929,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4843/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=929,856,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4844/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=930,048,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4845/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=930,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4846/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=930,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4847/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=930,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4848/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=930,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4849/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=931,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4850/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=931,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4851/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=931,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4852/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=931,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4853/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=931,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4854/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=931,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4855/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=932,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4856/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=932,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4857/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=932,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4858/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=932,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4859/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=932,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4860/500000]
+ optim/total_grad_norm=2.169
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=933,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=4861/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=933,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4862/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=933,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4863/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=933,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4864/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=933,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4865/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=934,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4866/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=934,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4867/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=934,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4868/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=934,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4869/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=934,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4870/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=935,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4871/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=935,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4872/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=935,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4873/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=935,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4874/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=935,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4875/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=936,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4876/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=936,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4877/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=936,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4878/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=936,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4879/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=936,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4880/500000]
+ optim/total_grad_norm=1.156
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=936,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4881/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=937,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4882/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=937,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4883/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=937,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4884/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=937,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4885/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=937,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4886/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=938,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4887/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=938,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4888/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=938,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4889/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=938,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4890/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=938,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4891/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=939,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4892/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=939,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4893/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=939,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4894/500000]
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=939,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4895/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=939,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4896/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=940,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4897/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=940,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4898/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=940,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4899/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=940,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4900/500000]
+ optim/total_grad_norm=1.826
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=940,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4901/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=940,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4902/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=941,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4903/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=941,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4904/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=941,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4905/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=941,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4906/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=941,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4907/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=942,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4908/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=942,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4909/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=942,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4910/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=942,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=4911/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=942,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4912/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=943,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4913/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=943,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4914/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=943,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4915/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=943,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4916/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=943,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4917/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=944,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4918/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=944,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4919/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=944,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4920/500000]
+ optim/total_grad_norm=1.746
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=944,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4921/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=944,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4922/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=945,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4923/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=945,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4924/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=945,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4925/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=945,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4926/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=945,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4927/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=945,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4928/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=946,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4929/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=946,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4930/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=946,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4931/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=946,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4932/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=946,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4933/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=947,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4934/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=947,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4935/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=947,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4936/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=947,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4937/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=947,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4938/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=948,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4939/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=948,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4940/500000]
+ optim/total_grad_norm=1.343
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=948,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4941/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=948,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4942/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=948,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4943/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=949,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4944/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=949,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4945/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=949,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4946/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=949,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4947/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=949,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4948/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=950,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4949/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=950,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4950/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=950,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4951/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=950,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4952/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=950,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4953/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=950,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4954/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=951,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4955/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=951,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=4956/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=951,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4957/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=951,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4958/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=951,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4959/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=952,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4960/500000]
+ optim/total_grad_norm=1.980
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=952,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=4961/500000]
+ train/ActionNoiseL2Loss=0.0140
+ throughput/total_tokens=952,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4962/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=952,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4963/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=952,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4964/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=953,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4965/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=953,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4966/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=953,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4967/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=953,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4968/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=953,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4969/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=954,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4970/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=954,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4971/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=954,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4972/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=954,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4973/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=954,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4974/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=955,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4975/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=955,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4976/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=955,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4977/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=955,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4978/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=955,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4979/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=955,968,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4980/500000]
+ optim/total_grad_norm=2.278
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=956,160,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4981/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=956,352,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4982/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=956,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4983/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=956,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4984/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=956,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4985/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=957,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4986/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=957,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4987/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=957,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4988/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=957,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4989/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=957,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4990/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=958,080,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=4991/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=958,272,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4992/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=958,464,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4993/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=958,656,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=4994/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=958,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4995/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=959,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4996/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=959,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4997/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=959,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4998/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=959,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=4999/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=959,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5000/500000]
+ optim/total_grad_norm=1.358
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=960,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+10/03 [22:14:31] INFO | >> Saving config... checkpoint.py:608
+10/03 [22:15:15] INFO | >> Saving model state... checkpoint.py:796
+10/03 [22:16:27] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [22:17:57] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=5001/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=960,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5002/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=960,384,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=5003/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=960,576,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5004/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=960,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=5005/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=960,960,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5006/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=961,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5007/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=961,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5008/500000]
+ train/ActionNoiseL2Loss=0.1440
+ throughput/total_tokens=961,536,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=5009/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=961,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5010/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=961,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5011/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=962,112,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5012/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=962,304,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5013/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=962,496,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5014/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=962,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5015/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=962,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5016/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=963,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5017/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=963,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5018/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=963,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5019/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=963,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5020/500000]
+ optim/total_grad_norm=1.014
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=963,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5021/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=964,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5022/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=964,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5023/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=964,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5024/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=964,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5025/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=964,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5026/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=964,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5027/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=965,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5028/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=965,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5029/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=965,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5030/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=965,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5031/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=965,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5032/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=966,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5033/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=966,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5034/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=966,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5035/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=966,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5036/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=966,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5037/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=967,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5038/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=967,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5039/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=967,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5040/500000]
+ optim/total_grad_norm=1.203
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=967,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5041/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=967,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5042/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=968,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5043/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=968,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5044/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=968,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5045/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=968,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5046/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=968,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5047/500000]
+ train/ActionNoiseL2Loss=0.1180
+ throughput/total_tokens=969,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5048/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=969,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5049/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=969,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5050/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=969,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5051/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=969,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5052/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=969,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5053/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=970,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5054/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=970,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5055/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=970,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5056/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=970,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5057/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=970,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5058/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=971,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5059/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=971,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5060/500000]
+ optim/total_grad_norm=0.9793
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=971,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=5061/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=971,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5062/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=971,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5063/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=972,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5064/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=972,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5065/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=972,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5066/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=972,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5067/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=972,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5068/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=973,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5069/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=973,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5070/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=973,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5071/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=973,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5072/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=973,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5073/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=974,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5074/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=974,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5075/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=974,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5076/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=974,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5077/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=974,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5078/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=974,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5079/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=975,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5080/500000]
+ optim/total_grad_norm=1.482
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=975,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5081/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=975,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5082/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=975,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5083/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=975,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5084/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=976,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5085/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=976,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5086/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=976,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5087/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=976,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5088/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=976,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5089/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=977,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5090/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=977,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5091/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=977,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5092/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=977,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5093/500000]
+ train/ActionNoiseL2Loss=0.1487
+ throughput/total_tokens=977,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5094/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=978,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5095/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=978,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5096/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=978,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5097/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=978,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5098/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=978,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5099/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=979,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5100/500000]
+ optim/total_grad_norm=1.773
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=979,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5101/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=979,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5102/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=979,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5103/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=979,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5104/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=979,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5105/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=980,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5106/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=980,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5107/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=980,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5108/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=980,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5109/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=980,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5110/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=981,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=5111/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=981,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5112/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=981,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5113/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=981,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5114/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=981,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5115/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=982,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5116/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=982,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5117/500000]
+ train/ActionNoiseL2Loss=0.0131
+ throughput/total_tokens=982,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5118/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=982,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5119/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=982,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5120/500000]
+ optim/total_grad_norm=0.7326
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=983,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5121/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=983,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5122/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=983,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5123/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=983,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5124/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=983,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5125/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=984,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5126/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=984,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5127/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=984,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5128/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=984,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5129/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=984,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5130/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=984,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5131/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=985,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5132/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=985,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5133/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=985,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5134/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=985,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5135/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=985,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5136/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=986,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5137/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=986,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5138/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=986,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5139/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=986,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5140/500000]
+ optim/total_grad_norm=1.084
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=986,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5141/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=987,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5142/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=987,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5143/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=987,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5144/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=987,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5145/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=987,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5146/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=988,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5147/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=988,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5148/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=988,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5149/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=988,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5150/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=988,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5151/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=988,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5152/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=989,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5153/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=989,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5154/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=989,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5155/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=989,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5156/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=989,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5157/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=990,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5158/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=990,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5159/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=990,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5160/500000]
+ optim/total_grad_norm=1.045
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=990,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=5161/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=990,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5162/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=991,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5163/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=991,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5164/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=991,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5165/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=991,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5166/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=991,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5167/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=992,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5168/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=992,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5169/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=992,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5170/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=992,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5171/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=992,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5172/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=993,024,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=5173/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=993,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5174/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=993,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5175/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=993,600,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5176/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=993,792,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=5177/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=993,984,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5178/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=994,176,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5179/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=994,368,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5180/500000]
+ optim/total_grad_norm=1.121
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=994,560,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5181/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=994,752,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5182/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=994,944,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5183/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=995,136,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5184/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=995,328,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5185/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=995,520,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5186/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=995,712,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5187/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=995,904,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5188/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=996,096,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5189/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=996,288,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5190/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=996,480,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5191/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=996,672,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5192/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=996,864,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5193/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=997,056,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5194/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=997,248,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5195/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=997,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5196/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=997,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5197/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=997,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5198/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=998,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5199/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=998,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5200/500000]
+ optim/total_grad_norm=0.9743
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=998,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5201/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=998,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5202/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=998,784,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5203/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=998,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5204/500000]
+ train/ActionNoiseL2Loss=0.1240
+ throughput/total_tokens=999,168,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5205/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=999,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5206/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=999,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5207/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=999,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5208/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=999,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5209/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,000,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5210/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,000,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=5211/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,000,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5212/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,000,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5213/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=1,000,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5214/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,001,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5215/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,001,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5216/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,001,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5217/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,001,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5218/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,001,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5219/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=1,002,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5220/500000]
+ optim/total_grad_norm=2.055
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,002,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5221/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,002,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5222/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,002,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5223/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=1,002,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5224/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=1,003,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5225/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=1,003,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5226/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,003,392,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5227/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,003,584,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5228/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,003,776,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5229/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,003,968,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5230/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,004,160,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5231/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,004,352,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5232/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,004,544,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5233/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,004,736,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5234/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,004,928,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5235/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,005,120,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5236/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,005,312,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5237/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,005,504,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5238/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,005,696,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5239/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,005,888,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5240/500000]
+ optim/total_grad_norm=1.035
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,006,080,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5241/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,006,272,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5242/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,006,464,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5243/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,006,656,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5244/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=1,006,848,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5245/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,007,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5246/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,007,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5247/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,007,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5248/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,007,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5249/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,007,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5250/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,008,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5251/500000]
+ train/ActionNoiseL2Loss=0.1304
+ throughput/total_tokens=1,008,192,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5252/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,008,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5253/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,008,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5254/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,008,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5255/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=1,008,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5256/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,009,152,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5257/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,009,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5258/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,009,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5259/500000]
+ train/ActionNoiseL2Loss=0.1420
+ throughput/total_tokens=1,009,728,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5260/500000]
+ optim/total_grad_norm=1.392
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,009,920,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=5261/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,010,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5262/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,010,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5263/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,010,496,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5264/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,010,688,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5265/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,010,880,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5266/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,011,072,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5267/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,011,264,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5268/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,011,456,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5269/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,011,648,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5270/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,011,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5271/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,012,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5272/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,012,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5273/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,012,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5274/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,012,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5275/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,012,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5276/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,012,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5277/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,013,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5278/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=1,013,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5279/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,013,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5280/500000]
+ optim/total_grad_norm=1.752
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,013,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5281/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,013,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5282/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,014,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5283/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,014,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5284/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,014,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5285/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,014,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5286/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,014,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5287/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,015,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5288/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,015,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5289/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,015,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5290/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,015,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5291/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,015,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5292/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,016,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5293/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,016,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5294/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,016,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5295/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,016,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5296/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,016,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5297/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,017,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5298/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,017,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5299/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,017,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5300/500000]
+ optim/total_grad_norm=1.809
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,017,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5301/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,017,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5302/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=1,017,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5303/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=1,018,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5304/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,018,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5305/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,018,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5306/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,018,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5307/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,018,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5308/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,019,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5309/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,019,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5310/500000]
+ train/ActionNoiseL2Loss=0.1323
+ throughput/total_tokens=1,019,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=5311/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,019,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5312/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,019,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5313/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,020,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5314/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,020,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5315/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,020,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5316/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,020,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5317/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,020,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5318/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,021,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5319/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,021,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5320/500000]
+ optim/total_grad_norm=1.366
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,021,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5321/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,021,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5322/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,021,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5323/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,022,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5324/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,022,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5325/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,022,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5326/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,022,592,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5327/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,022,784,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5328/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,022,976,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5329/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,023,168,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5330/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,023,360,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5331/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,023,552,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5332/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,023,744,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5333/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,023,936,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5334/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,024,128,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5335/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,024,320,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5336/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,024,512,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5337/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,024,704,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5338/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,024,896,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5339/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,025,088,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5340/500000]
+ optim/total_grad_norm=1.232
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,025,280,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5341/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,025,472,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5342/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,025,664,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5343/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,025,856,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5344/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,026,048,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5345/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,026,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5346/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=1,026,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5347/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,026,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5348/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,026,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5349/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,027,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5350/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,027,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5351/500000]
+ train/ActionNoiseL2Loss=0.0998
+ throughput/total_tokens=1,027,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5352/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,027,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5353/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=1,027,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5354/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,027,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5355/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,028,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5356/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=1,028,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5357/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,028,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5358/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,028,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5359/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,028,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5360/500000]
+ optim/total_grad_norm=1.559
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,029,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=5361/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,029,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5362/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,029,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5363/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,029,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5364/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=1,029,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5365/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,030,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5366/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=1,030,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5367/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,030,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5368/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,030,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5369/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,030,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5370/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,031,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5371/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,031,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5372/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,031,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5373/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,031,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5374/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,031,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5375/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,032,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5376/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,032,192,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5377/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,032,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5378/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,032,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5379/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,032,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5380/500000]
+ optim/total_grad_norm=1.434
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,032,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5381/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,033,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5382/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,033,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5383/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,033,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5384/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,033,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5385/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,033,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5386/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,034,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5387/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,034,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5388/500000]
+ train/ActionNoiseL2Loss=0.1450
+ throughput/total_tokens=1,034,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5389/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,034,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5390/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,034,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5391/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=1,035,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5392/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,035,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5393/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,035,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5394/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,035,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5395/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,035,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5396/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,036,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5397/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=1,036,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5398/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,036,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5399/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,036,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5400/500000]
+ optim/total_grad_norm=2.230
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=1,036,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5401/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,036,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5402/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,037,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5403/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,037,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5404/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,037,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5405/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,037,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5406/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,037,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5407/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=1,038,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5408/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,038,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5409/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,038,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5410/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,038,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=5411/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,038,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5412/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,039,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5413/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,039,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5414/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,039,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5415/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,039,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5416/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,039,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5417/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,040,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5418/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,040,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5419/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,040,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5420/500000]
+ optim/total_grad_norm=1.080
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,040,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5421/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=1,040,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5422/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,041,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5423/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,041,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5424/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,041,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5425/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,041,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5426/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,041,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5427/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,041,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5428/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,042,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5429/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,042,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5430/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,042,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5431/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,042,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5432/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,042,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5433/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,043,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5434/500000]
+ train/ActionNoiseL2Loss=0.0128
+ throughput/total_tokens=1,043,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5435/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,043,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5436/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,043,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5437/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=1,043,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5438/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,044,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5439/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,044,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5440/500000]
+ optim/total_grad_norm=1.430
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,044,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5441/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,044,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5442/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=1,044,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5443/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,045,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5444/500000]
+ train/ActionNoiseL2Loss=0.1447
+ throughput/total_tokens=1,045,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5445/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,045,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5446/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,045,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5447/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=1,045,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5448/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,046,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5449/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,046,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5450/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,046,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5451/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,046,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5452/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,046,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5453/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,046,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5454/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,047,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5455/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,047,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5456/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,047,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5457/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=1,047,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5458/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,047,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5459/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,048,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5460/500000]
+ optim/total_grad_norm=1.051
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,048,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=5461/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=1,048,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5462/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,048,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5463/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,048,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5464/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=1,049,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5465/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,049,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5466/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,049,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5467/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,049,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5468/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,049,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5469/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,050,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5470/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,050,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5471/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,050,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5472/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,050,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5473/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,050,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5474/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,051,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5475/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,051,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5476/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,051,392,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5477/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=1,051,584,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5478/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,051,776,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5479/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,051,968,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5480/500000]
+ optim/total_grad_norm=1.396
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,052,160,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5481/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,052,352,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5482/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,052,544,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5483/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,052,736,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5484/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=1,052,928,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5485/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,053,120,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5486/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=1,053,312,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5487/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,053,504,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5488/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,053,696,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5489/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,053,888,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5490/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,054,080,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5491/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,054,272,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5492/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,054,464,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=5493/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,054,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5494/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,054,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5495/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,055,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5496/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=1,055,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5497/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,055,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5498/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,055,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5499/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,055,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5500/500000]
+ optim/total_grad_norm=1.501
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,056,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+10/04 [01:12:23] INFO | >> Saving config... checkpoint.py:608
+10/04 [01:13:19] INFO | >> Saving model state... checkpoint.py:796
+10/04 [01:14:31] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [01:16:04] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=5501/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,056,192,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=5502/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,056,384,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0487
+[step=5503/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,056,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=5504/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,056,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=5505/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,056,960,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=5506/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,057,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5507/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,057,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5508/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,057,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5509/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,057,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5510/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,057,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5511/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,058,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5512/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,058,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5513/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,058,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5514/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,058,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5515/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=1,058,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5516/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,059,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5517/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,059,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5518/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,059,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5519/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=1,059,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5520/500000]
+ optim/total_grad_norm=1.161
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,059,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5521/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,060,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5522/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,060,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5523/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,060,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5524/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,060,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5525/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,060,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5526/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,060,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5527/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,061,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5528/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,061,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5529/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,061,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5530/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,061,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5531/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,061,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5532/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,062,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5533/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,062,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5534/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,062,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5535/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,062,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5536/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,062,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5537/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,063,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5538/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,063,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5539/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,063,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5540/500000]
+ optim/total_grad_norm=1.551
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,063,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5541/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,063,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5542/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,064,064,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5543/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,064,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5544/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,064,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5545/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,064,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5546/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,064,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5547/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,065,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5548/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,065,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5549/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,065,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5550/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,065,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5551/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,065,792,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5552/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,065,984,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5553/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,066,176,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5554/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,066,368,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5555/500000]
+ train/ActionNoiseL2Loss=0.1360
+ throughput/total_tokens=1,066,560,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5556/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,066,752,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5557/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,066,944,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5558/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,067,136,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5559/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,067,328,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5560/500000]
+ optim/total_grad_norm=1.199
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,067,520,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=5561/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,067,712,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5562/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=1,067,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5563/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,068,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5564/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,068,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5565/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,068,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5566/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,068,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5567/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=1,068,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5568/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,069,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5569/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,069,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5570/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,069,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5571/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=1,069,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5572/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,069,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5573/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,070,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5574/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,070,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5575/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,070,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5576/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,070,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5577/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=1,070,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5578/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=1,070,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5579/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,071,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5580/500000]
+ optim/total_grad_norm=1.731
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,071,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5581/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=1,071,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5582/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,071,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5583/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=1,071,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5584/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,072,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5585/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,072,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5586/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,072,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5587/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,072,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5588/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,072,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5589/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,073,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5590/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,073,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5591/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,073,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5592/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,073,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5593/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,073,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5594/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,074,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5595/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,074,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5596/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,074,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5597/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,074,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5598/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,074,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5599/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,075,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5600/500000]
+ optim/total_grad_norm=3.920
+ train/ActionNoiseL2Loss=0.1327
+ throughput/total_tokens=1,075,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5601/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,075,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5602/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,075,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5603/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,075,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5604/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,075,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5605/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,076,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5606/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=1,076,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5607/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,076,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5608/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,076,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5609/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,076,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5610/500000]
+ train/ActionNoiseL2Loss=0.1772
+ throughput/total_tokens=1,077,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=5611/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,077,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5612/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,077,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5613/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,077,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5614/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,077,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5615/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,078,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5616/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,078,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5617/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,078,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5618/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,078,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5619/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=1,078,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5620/500000]
+ optim/total_grad_norm=1.343
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,079,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5621/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,079,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5622/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,079,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5623/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,079,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5624/500000]
+ train/ActionNoiseL2Loss=0.0138
+ throughput/total_tokens=1,079,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5625/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,080,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5626/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,080,192,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5627/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=1,080,384,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5628/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,080,576,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5629/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,080,768,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5630/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,080,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5631/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,081,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5632/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,081,344,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5633/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,081,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5634/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,081,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5635/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,081,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5636/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,082,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5637/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,082,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5638/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,082,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5639/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,082,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5640/500000]
+ optim/total_grad_norm=1.568
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,082,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5641/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,083,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5642/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,083,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5643/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,083,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5644/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,083,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5645/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,083,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5646/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,084,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5647/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,084,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5648/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,084,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5649/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,084,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5650/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=1,084,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5651/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,084,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5652/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,085,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5653/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=1,085,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5654/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,085,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5655/500000]
+ train/ActionNoiseL2Loss=0.0961
+ throughput/total_tokens=1,085,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5656/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,085,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5657/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,086,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5658/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,086,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5659/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,086,528,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5660/500000]
+ optim/total_grad_norm=1.801
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=1,086,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=5661/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,086,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5662/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,087,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5663/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,087,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5664/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,087,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5665/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,087,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5666/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,087,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5667/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,088,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5668/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,088,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5669/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,088,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5670/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,088,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5671/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,088,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5672/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,089,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5673/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,089,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5674/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,089,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5675/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,089,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5676/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,089,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5677/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,089,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5678/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,090,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5679/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=1,090,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5680/500000]
+ optim/total_grad_norm=1.606
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,090,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5681/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,090,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5682/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,090,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5683/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,091,136,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5684/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,091,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5685/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,091,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5686/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,091,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5687/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,091,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5688/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,092,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5689/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,092,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5690/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,092,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5691/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,092,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5692/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,092,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5693/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,093,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5694/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,093,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5695/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,093,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5696/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,093,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5697/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,093,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5698/500000]
+ train/ActionNoiseL2Loss=0.0118
+ throughput/total_tokens=1,094,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5699/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,094,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5700/500000]
+ optim/total_grad_norm=1.734
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,094,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5701/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,094,592,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5702/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=1,094,784,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5703/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=1,094,976,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5704/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,095,168,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5705/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,095,360,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5706/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,095,552,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5707/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,095,744,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5708/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,095,936,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5709/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,096,128,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5710/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,096,320,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+ System/Peak GPU Memory (MB)=46,467
+[step=5711/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,096,512,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5712/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,096,704,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5713/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,096,896,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5714/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,097,088,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5715/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,097,280,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5716/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,097,472,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5717/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,097,664,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5718/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,097,856,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5719/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,098,048,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=5720/500000]
+ optim/total_grad_norm=1.335
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,098,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5721/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,098,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5722/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,098,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5723/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,098,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5724/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,099,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5725/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=1,099,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5726/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=1,099,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5727/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,099,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5728/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,099,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5729/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,099,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5730/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,100,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5731/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,100,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5732/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,100,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5733/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,100,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5734/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,100,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5735/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,101,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5736/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,101,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5737/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,101,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5738/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,101,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5739/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,101,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5740/500000]
+ optim/total_grad_norm=1.136
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,102,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5741/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,102,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5742/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,102,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5743/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,102,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5744/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,102,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5745/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=1,103,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5746/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,103,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5747/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,103,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5748/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,103,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5749/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,103,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5750/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,104,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5751/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,104,192,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5752/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,104,384,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5753/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,104,576,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5754/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,104,768,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5755/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,104,960,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5756/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,105,152,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5757/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,105,344,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5758/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,105,536,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5759/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,105,728,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5760/500000]
+ optim/total_grad_norm=0.9223
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,105,920,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=5761/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,106,112,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5762/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,106,304,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5763/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,106,496,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5764/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,106,688,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5765/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,106,880,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5766/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,107,072,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5767/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,107,264,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5768/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,107,456,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5769/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,107,648,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5770/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,107,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5771/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,108,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5772/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=1,108,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5773/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,108,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5774/500000]
+ train/ActionNoiseL2Loss=0.1487
+ throughput/total_tokens=1,108,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5775/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,108,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5776/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,108,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5777/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=1,109,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5778/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,109,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5779/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,109,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5780/500000]
+ optim/total_grad_norm=1.656
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,109,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5781/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,109,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5782/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,110,144,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5783/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,110,336,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5784/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,110,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5785/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,110,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5786/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,110,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5787/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,111,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5788/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,111,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5789/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,111,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5790/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,111,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5791/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,111,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5792/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,112,064,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5793/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,112,256,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5794/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,112,448,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5795/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,112,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5796/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,112,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5797/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,113,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5798/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,113,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5799/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,113,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5800/500000]
+ optim/total_grad_norm=1.030
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,113,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5801/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,113,792,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5802/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,113,984,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5803/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,114,176,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5804/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,114,368,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5805/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,114,560,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5806/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,114,752,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5807/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=1,114,944,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5808/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,115,136,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5809/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,115,328,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5810/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,115,520,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=5811/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,115,712,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5812/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,115,904,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5813/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,116,096,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5814/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,116,288,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5815/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,116,480,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5816/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,116,672,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5817/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,116,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5818/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,117,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5819/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,117,248,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5820/500000]
+ optim/total_grad_norm=0.8309
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,117,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5821/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,117,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5822/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,117,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5823/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,118,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5824/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,118,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5825/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,118,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5826/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,118,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5827/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,118,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5828/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,118,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5829/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,119,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5830/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,119,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5831/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,119,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5832/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=1,119,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5833/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,119,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5834/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,120,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5835/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,120,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5836/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,120,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5837/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,120,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5838/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,120,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5839/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,121,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5840/500000]
+ optim/total_grad_norm=1.263
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,121,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5841/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,121,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5842/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,121,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5843/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,121,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5844/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,122,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5845/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,122,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5846/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,122,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5847/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,122,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5848/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,122,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5849/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=1,123,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5850/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=1,123,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5851/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,123,392,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5852/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,123,584,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5853/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,123,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5854/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=1,123,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5855/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,124,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5856/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,124,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5857/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=1,124,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5858/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,124,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5859/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,124,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5860/500000]
+ optim/total_grad_norm=1.627
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,125,120,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=5861/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,125,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5862/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,125,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5863/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=1,125,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5864/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,125,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5865/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,126,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5866/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,126,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5867/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,126,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5868/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,126,656,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5869/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,126,848,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5870/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,127,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5871/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,127,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5872/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,127,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5873/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,127,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5874/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,127,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5875/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,128,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5876/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,128,192,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5877/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,128,384,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5878/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,128,576,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5879/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,128,768,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5880/500000]
+ optim/total_grad_norm=0.9228
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,128,960,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5881/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=1,129,152,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5882/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,129,344,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5883/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,129,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5884/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,129,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5885/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,129,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5886/500000]
+ train/ActionNoiseL2Loss=0.0116
+ throughput/total_tokens=1,130,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5887/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,130,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5888/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,130,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5889/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,130,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5890/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=1,130,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5891/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,131,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5892/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,131,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5893/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,131,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5894/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,131,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5895/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,131,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5896/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,132,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5897/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,132,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5898/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,132,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5899/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,132,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5900/500000]
+ optim/total_grad_norm=1.191
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,132,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=5901/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,132,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5902/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,133,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5903/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,133,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5904/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=1,133,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5905/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,133,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5906/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,133,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5907/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,134,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5908/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,134,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5909/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,134,528,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5910/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,134,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=5911/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,134,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5912/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,135,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5913/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,135,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5914/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,135,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5915/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,135,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5916/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,135,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5917/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,136,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5918/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,136,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5919/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,136,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5920/500000]
+ optim/total_grad_norm=1.584
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=1,136,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5921/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,136,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5922/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,137,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5923/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,137,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5924/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,137,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5925/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,137,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5926/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,137,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5927/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,137,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5928/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=1,138,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5929/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,138,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5930/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,138,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5931/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,138,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5932/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,138,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5933/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,139,136,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5934/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,139,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5935/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,139,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5936/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,139,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5937/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,139,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5938/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,140,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5939/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,140,288,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5940/500000]
+ optim/total_grad_norm=2.097
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=1,140,480,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5941/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,140,672,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=5942/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,140,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5943/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,141,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5944/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,141,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5945/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,141,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5946/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,141,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5947/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=1,141,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5948/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,142,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5949/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,142,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5950/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,142,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5951/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,142,592,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=5952/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,142,784,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=5953/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,142,976,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=5954/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,143,168,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=5955/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,143,360,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5956/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,143,552,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=5957/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,143,744,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=5958/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,143,936,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5959/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,144,128,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5960/500000]
+ optim/total_grad_norm=0.9673
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,144,320,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=5961/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,144,512,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5962/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,144,704,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=5963/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,144,896,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5964/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,145,088,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5965/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,145,280,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5966/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,145,472,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5967/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,145,664,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5968/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,145,856,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5969/500000]
+ train/ActionNoiseL2Loss=0.0130
+ throughput/total_tokens=1,146,048,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=5970/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,146,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5971/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,146,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5972/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,146,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5973/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,146,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5974/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,147,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5975/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,147,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5976/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,147,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5977/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,147,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5978/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,147,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5979/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=1,147,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5980/500000]
+ optim/total_grad_norm=1.550
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,148,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5981/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,148,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5982/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,148,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5983/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,148,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5984/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=1,148,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5985/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,149,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5986/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,149,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5987/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,149,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5988/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,149,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5989/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,149,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5990/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,150,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=5991/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=1,150,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5992/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,150,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5993/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,150,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5994/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,150,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5995/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,151,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5996/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,151,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5997/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,151,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5998/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,151,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=5999/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,151,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6000/500000]
+ optim/total_grad_norm=1.340
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,152,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+10/04 [04:10:29] INFO | >> Saving config... checkpoint.py:608
+10/04 [04:11:13] INFO | >> Saving model state... checkpoint.py:796
+10/04 [04:12:21] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [04:13:51] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=6001/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,152,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6002/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,152,384,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=6003/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,152,576,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=6004/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,152,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6005/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,152,960,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6006/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,153,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6007/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,153,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6008/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,153,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6009/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=1,153,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6010/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,153,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=6011/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,154,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6012/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,154,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6013/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,154,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6014/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,154,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6015/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,154,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6016/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,155,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6017/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,155,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6018/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,155,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6019/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,155,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6020/500000]
+ optim/total_grad_norm=1.091
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,155,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6021/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,156,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6022/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,156,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6023/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,156,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6024/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=1,156,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6025/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,156,800,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6026/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,156,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6027/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,157,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6028/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,157,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6029/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=1,157,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6030/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=1,157,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6031/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,157,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6032/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,158,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6033/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,158,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6034/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,158,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6035/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,158,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6036/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,158,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6037/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,159,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6038/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,159,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6039/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=1,159,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6040/500000]
+ optim/total_grad_norm=1.814
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,159,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=6041/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,159,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6042/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,160,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6043/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,160,256,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6044/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,160,448,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6045/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,160,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6046/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,160,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6047/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,161,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6048/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,161,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6049/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,161,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6050/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,161,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6051/500000]
+ train/ActionNoiseL2Loss=0.0115
+ throughput/total_tokens=1,161,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6052/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,161,984,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=6053/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,162,176,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=6054/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,162,368,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=6055/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,162,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6056/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,162,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6057/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,162,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6058/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,163,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6059/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=1,163,328,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=6060/500000]
+ optim/total_grad_norm=1.053
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,163,520,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=6061/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,163,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6062/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,163,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6063/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=1,164,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6064/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,164,288,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=6065/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,164,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6066/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,164,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6067/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,164,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6068/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,165,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6069/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,165,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6070/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,165,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6071/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=1,165,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6072/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,165,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6073/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,166,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6074/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,166,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6075/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,166,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6076/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,166,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6077/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,166,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6078/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,166,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6079/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,167,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6080/500000]
+ optim/total_grad_norm=1.586
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,167,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6081/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,167,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6082/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,167,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6083/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,167,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6084/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,168,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6085/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,168,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6086/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,168,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6087/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,168,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6088/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,168,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6089/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,169,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6090/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,169,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6091/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,169,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6092/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,169,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6093/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,169,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6094/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,170,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6095/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=1,170,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6096/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,170,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6097/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,170,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6098/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,170,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6099/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,171,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6100/500000]
+ optim/total_grad_norm=1.478
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,171,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6101/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,171,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6102/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,171,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6103/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,171,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6104/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,171,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6105/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,172,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6106/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,172,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6107/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,172,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6108/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,172,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6109/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,172,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6110/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,173,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=6111/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,173,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6112/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,173,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6113/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,173,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6114/500000]
+ train/ActionNoiseL2Loss=0.1239
+ throughput/total_tokens=1,173,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6115/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,174,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6116/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,174,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6117/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,174,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6118/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=1,174,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6119/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,174,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6120/500000]
+ optim/total_grad_norm=1.470
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,175,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6121/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,175,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6122/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,175,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6123/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,175,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6124/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=1,175,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6125/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=1,176,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6126/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,176,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6127/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=1,176,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6128/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,176,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6129/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=1,176,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6130/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,176,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6131/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,177,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6132/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,177,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6133/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,177,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6134/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,177,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6135/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,177,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6136/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,178,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6137/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,178,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6138/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,178,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6139/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,178,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6140/500000]
+ optim/total_grad_norm=1.431
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,178,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6141/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,179,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6142/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,179,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6143/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,179,456,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6144/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,179,648,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6145/500000]
+ train/ActionNoiseL2Loss=0.0998
+ throughput/total_tokens=1,179,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6146/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,180,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6147/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,180,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6148/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,180,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6149/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,180,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6150/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,180,800,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6151/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,180,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6152/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,181,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6153/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,181,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6154/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,181,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6155/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,181,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6156/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,181,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6157/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,182,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6158/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,182,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6159/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,182,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6160/500000]
+ optim/total_grad_norm=1.692
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=1,182,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=6161/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,182,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6162/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,183,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6163/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,183,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6164/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,183,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6165/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,183,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6166/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,183,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6167/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,184,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6168/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=1,184,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6169/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,184,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6170/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,184,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6171/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,184,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6172/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,185,024,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6173/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,185,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6174/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,185,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6175/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,185,600,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6176/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,185,792,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6177/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,185,984,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6178/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,186,176,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6179/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,186,368,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6180/500000]
+ optim/total_grad_norm=2.576
+ train/ActionNoiseL2Loss=0.1250
+ throughput/total_tokens=1,186,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6181/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,186,752,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6182/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,186,944,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6183/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,187,136,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6184/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=1,187,328,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6185/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,187,520,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6186/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,187,712,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6187/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,187,904,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6188/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,188,096,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6189/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=1,188,288,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6190/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,188,480,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6191/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,188,672,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6192/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,188,864,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6193/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,189,056,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6194/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,189,248,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6195/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,189,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6196/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,189,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6197/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,189,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6198/500000]
+ train/ActionNoiseL2Loss=0.1259
+ throughput/total_tokens=1,190,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6199/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,190,208,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6200/500000]
+ optim/total_grad_norm=1.257
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,190,400,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6201/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,190,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6202/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,190,784,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6203/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,190,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6204/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,191,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6205/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,191,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6206/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,191,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6207/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,191,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6208/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,191,936,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6209/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,192,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6210/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,192,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=6211/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,192,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6212/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,192,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6213/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,192,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6214/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,193,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6215/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,193,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6216/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,193,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6217/500000]
+ train/ActionNoiseL2Loss=0.1349
+ throughput/total_tokens=1,193,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6218/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,193,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6219/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=1,194,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6220/500000]
+ optim/total_grad_norm=1.149
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,194,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6221/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,194,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6222/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,194,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6223/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,194,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6224/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,195,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6225/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,195,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6226/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=1,195,392,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6227/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,195,584,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6228/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=1,195,776,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6229/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,195,968,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6230/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,196,160,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6231/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,196,352,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6232/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,196,544,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6233/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,196,736,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6234/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,196,928,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6235/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=1,197,120,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6236/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,197,312,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6237/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,197,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6238/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,197,696,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6239/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,197,888,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6240/500000]
+ optim/total_grad_norm=1.694
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,198,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6241/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,198,272,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6242/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,198,464,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6243/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,198,656,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6244/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,198,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6245/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,199,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6246/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,199,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6247/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,199,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6248/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,199,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6249/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,199,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6250/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=1,200,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6251/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,200,192,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6252/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,200,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6253/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,200,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6254/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,200,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6255/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=1,200,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6256/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,201,152,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6257/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,201,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6258/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,201,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6259/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,201,728,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6260/500000]
+ optim/total_grad_norm=1.641
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,201,920,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=6261/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,202,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6262/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,202,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6263/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,202,496,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6264/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,202,688,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6265/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,202,880,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6266/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,203,072,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6267/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,203,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6268/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=1,203,456,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6269/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,203,648,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6270/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,203,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6271/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=1,204,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6272/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,204,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6273/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,204,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6274/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,204,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6275/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,204,800,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6276/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,204,992,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6277/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,205,184,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6278/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,205,376,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6279/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,205,568,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6280/500000]
+ optim/total_grad_norm=0.9741
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,205,760,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6281/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,205,952,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6282/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,206,144,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6283/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,206,336,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6284/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,206,528,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6285/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,206,720,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6286/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,206,912,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6287/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,207,104,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6288/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,207,296,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6289/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,207,488,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6290/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,207,680,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6291/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,207,872,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6292/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,208,064,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6293/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,208,256,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6294/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,208,448,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6295/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,208,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6296/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,208,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6297/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,209,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6298/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,209,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6299/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,209,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6300/500000]
+ optim/total_grad_norm=1.976
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,209,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6301/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,209,792,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6302/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,209,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6303/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,210,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6304/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,210,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6305/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,210,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6306/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,210,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6307/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,210,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6308/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,211,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6309/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,211,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6310/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,211,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=6311/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,211,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6312/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,211,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6313/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,212,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6314/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,212,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6315/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,212,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6316/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,212,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6317/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,212,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6318/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,213,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6319/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=1,213,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6320/500000]
+ optim/total_grad_norm=1.728
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,213,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6321/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,213,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6322/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,213,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6323/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,214,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6324/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=1,214,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6325/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,214,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6326/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,214,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6327/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,214,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6328/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,214,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6329/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,215,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6330/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,215,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6331/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,215,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6332/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,215,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6333/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,215,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6334/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=1,216,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6335/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,216,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6336/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,216,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6337/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,216,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6338/500000]
+ train/ActionNoiseL2Loss=0.0116
+ throughput/total_tokens=1,216,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6339/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,217,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6340/500000]
+ optim/total_grad_norm=0.5985
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,217,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6341/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,217,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6342/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,217,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6343/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,217,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6344/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,218,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6345/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,218,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6346/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=1,218,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6347/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=1,218,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6348/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=1,218,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6349/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,219,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6350/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,219,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6351/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,219,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6352/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,219,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6353/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,219,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6354/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,219,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6355/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,220,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6356/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=1,220,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6357/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,220,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6358/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,220,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6359/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,220,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6360/500000]
+ optim/total_grad_norm=1.878
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,221,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=6361/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,221,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6362/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=1,221,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6363/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,221,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6364/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,221,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6365/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,222,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6366/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,222,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6367/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,222,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6368/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,222,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6369/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,222,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6370/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,223,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6371/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,223,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6372/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,223,424,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6373/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=1,223,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6374/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,223,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6375/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=1,224,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6376/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,224,192,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6377/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,224,384,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6378/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,224,576,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6379/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,224,768,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6380/500000]
+ optim/total_grad_norm=2.133
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,224,960,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6381/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,225,152,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6382/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,225,344,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6383/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,225,536,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6384/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,225,728,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6385/500000]
+ train/ActionNoiseL2Loss=0.0133
+ throughput/total_tokens=1,225,920,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6386/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,226,112,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6387/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,226,304,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6388/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,226,496,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6389/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,226,688,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6390/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,226,880,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6391/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,227,072,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6392/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,227,264,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6393/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=1,227,456,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6394/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,227,648,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6395/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,227,840,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6396/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,228,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6397/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,228,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6398/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,228,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6399/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,228,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6400/500000]
+ optim/total_grad_norm=1.498
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,228,800,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6401/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,228,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6402/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,229,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6403/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,229,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6404/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,229,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6405/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,229,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6406/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,229,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6407/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,230,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6408/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,230,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6409/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,230,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6410/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,230,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=6411/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,230,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6412/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=1,231,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6413/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,231,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6414/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,231,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6415/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,231,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6416/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,231,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6417/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=1,232,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6418/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,232,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6419/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,232,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6420/500000]
+ optim/total_grad_norm=1.342
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,232,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6421/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,232,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6422/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,233,024,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6423/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,233,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6424/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,233,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6425/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=1,233,600,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6426/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,233,792,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6427/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,233,984,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6428/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,234,176,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6429/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,234,368,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6430/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,234,560,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6431/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,234,752,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6432/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,234,944,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6433/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,235,136,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6434/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,235,328,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6435/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,235,520,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6436/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,235,712,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6437/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,235,904,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6438/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,236,096,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6439/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,236,288,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6440/500000]
+ optim/total_grad_norm=1.105
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,236,480,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6441/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,236,672,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6442/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,236,864,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6443/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,237,056,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6444/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,237,248,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6445/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,237,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6446/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,237,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6447/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,237,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6448/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,238,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6449/500000]
+ train/ActionNoiseL2Loss=0.0140
+ throughput/total_tokens=1,238,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6450/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,238,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6451/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,238,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6452/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,238,784,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6453/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,238,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6454/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,239,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6455/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,239,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6456/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,239,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6457/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,239,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6458/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,239,936,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6459/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=1,240,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6460/500000]
+ optim/total_grad_norm=2.432
+ train/ActionNoiseL2Loss=0.1209
+ throughput/total_tokens=1,240,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=6461/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,240,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6462/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,240,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6463/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,240,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6464/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,241,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6465/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,241,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6466/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,241,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6467/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,241,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6468/500000]
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=1,241,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6469/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,242,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6470/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=1,242,240,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6471/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,242,432,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6472/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,242,624,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6473/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,242,816,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6474/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=1,243,008,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6475/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,243,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6476/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,243,392,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6477/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,243,584,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6478/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,243,776,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6479/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,243,968,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6480/500000]
+ optim/total_grad_norm=0.7439
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,244,160,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6481/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,244,352,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6482/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,244,544,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6483/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,244,736,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6484/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,244,928,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6485/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,245,120,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6486/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,245,312,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6487/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,245,504,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6488/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=1,245,696,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6489/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,245,888,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6490/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=1,246,080,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6491/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=1,246,272,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6492/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,246,464,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6493/500000]
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=1,246,656,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6494/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,246,848,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6495/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,247,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6496/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=1,247,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6497/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,247,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6498/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,247,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6499/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,247,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6500/500000]
+ optim/total_grad_norm=1.263
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,248,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+10/04 [07:08:37] INFO | >> Saving config... checkpoint.py:608
+10/04 [07:09:08] INFO | >> Saving model state... checkpoint.py:796
+10/04 [07:10:20] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [07:11:51] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=6501/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,248,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6502/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,248,384,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=6503/500000]
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=1,248,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=6504/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,248,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=6505/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,248,960,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=6506/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,249,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=6507/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,249,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=6508/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,249,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6509/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,249,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=6510/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,249,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=6511/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,250,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6512/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,250,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6513/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,250,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6514/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,250,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6515/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,250,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6516/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,251,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6517/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,251,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6518/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,251,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6519/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,251,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6520/500000]
+ optim/total_grad_norm=2.522
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=1,251,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6521/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,252,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6522/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,252,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6523/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,252,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6524/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,252,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6525/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,252,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6526/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,252,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6527/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,253,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6528/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,253,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6529/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,253,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6530/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,253,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6531/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,253,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6532/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,254,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6533/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,254,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6534/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,254,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6535/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,254,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6536/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,254,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6537/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,255,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6538/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,255,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6539/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,255,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6540/500000]
+ optim/total_grad_norm=1.195
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,255,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6541/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,255,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6542/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,256,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6543/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,256,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6544/500000]
+ train/ActionNoiseL2Loss=0.0143
+ throughput/total_tokens=1,256,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6545/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,256,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6546/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,256,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6547/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,257,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6548/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,257,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6549/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,257,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6550/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,257,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6551/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,257,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6552/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,257,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6553/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,258,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6554/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,258,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6555/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,258,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6556/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,258,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6557/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,258,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6558/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,259,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6559/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,259,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6560/500000]
+ optim/total_grad_norm=1.937
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,259,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=6561/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,259,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6562/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,259,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6563/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,260,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6564/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,260,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6565/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,260,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6566/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,260,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6567/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,260,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6568/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,261,056,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=6569/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,261,248,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=6570/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,261,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=6571/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,261,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6572/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,261,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6573/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=1,262,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6574/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,262,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6575/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,262,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6576/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,262,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6577/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,262,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6578/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,262,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6579/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,263,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6580/500000]
+ optim/total_grad_norm=0.8993
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,263,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=6581/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,263,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6582/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,263,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6583/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,263,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6584/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,264,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6585/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,264,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6586/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,264,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6587/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,264,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6588/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,264,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6589/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,265,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6590/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,265,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6591/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,265,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6592/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,265,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6593/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,265,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6594/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,266,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6595/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,266,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6596/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=1,266,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6597/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,266,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6598/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=1,266,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6599/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=1,267,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6600/500000]
+ optim/total_grad_norm=2.898
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=1,267,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6601/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,267,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6602/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,267,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6603/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,267,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6604/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=1,267,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6605/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,268,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6606/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,268,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6607/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=1,268,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6608/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=1,268,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6609/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,268,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6610/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,269,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=6611/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=1,269,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6612/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,269,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6613/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,269,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6614/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,269,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6615/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,270,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6616/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,270,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6617/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,270,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6618/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,270,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6619/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,270,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6620/500000]
+ optim/total_grad_norm=1.248
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,271,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6621/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,271,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6622/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,271,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6623/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,271,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6624/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,271,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6625/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,272,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6626/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=1,272,192,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6627/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,272,384,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6628/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,272,576,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6629/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,272,768,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6630/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,272,960,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6631/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,273,152,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6632/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,273,344,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6633/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,273,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6634/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,273,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6635/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,273,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6636/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,274,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6637/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,274,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6638/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,274,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6639/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,274,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6640/500000]
+ optim/total_grad_norm=1.770
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,274,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6641/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,275,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6642/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,275,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6643/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,275,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6644/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,275,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6645/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,275,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6646/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,276,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6647/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,276,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6648/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,276,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6649/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,276,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6650/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,276,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6651/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=1,276,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6652/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,277,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6653/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=1,277,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6654/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,277,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6655/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,277,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6656/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,277,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6657/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,278,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6658/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,278,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6659/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,278,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6660/500000]
+ optim/total_grad_norm=1.324
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,278,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=6661/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=1,278,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6662/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,279,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6663/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,279,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6664/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,279,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6665/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,279,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6666/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=1,279,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6667/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,280,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6668/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=1,280,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6669/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,280,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6670/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,280,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6671/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,280,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6672/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=1,281,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6673/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,281,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6674/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,281,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6675/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,281,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6676/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,281,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6677/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,281,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6678/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,282,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6679/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,282,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6680/500000]
+ optim/total_grad_norm=1.252
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,282,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6681/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,282,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6682/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,282,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6683/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,283,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6684/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,283,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6685/500000]
+ train/ActionNoiseL2Loss=0.1242
+ throughput/total_tokens=1,283,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6686/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=1,283,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6687/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,283,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6688/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,284,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6689/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,284,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6690/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,284,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6691/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,284,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6692/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,284,864,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6693/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,285,056,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6694/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,285,248,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6695/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=1,285,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6696/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,285,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6697/500000]
+ train/ActionNoiseL2Loss=0.1659
+ throughput/total_tokens=1,285,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6698/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,286,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6699/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,286,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6700/500000]
+ optim/total_grad_norm=0.9798
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,286,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6701/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,286,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6702/500000]
+ train/ActionNoiseL2Loss=0.1128
+ throughput/total_tokens=1,286,784,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6703/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,286,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6704/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,287,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6705/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=1,287,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6706/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,287,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6707/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,287,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6708/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,287,936,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6709/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,288,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6710/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,288,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=6711/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,288,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6712/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,288,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6713/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=1,288,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6714/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,289,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6715/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,289,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6716/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,289,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6717/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,289,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6718/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,289,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6719/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,290,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6720/500000]
+ optim/total_grad_norm=1.097
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,290,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6721/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,290,432,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6722/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,290,624,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6723/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,290,816,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6724/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,291,008,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6725/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,291,200,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=6726/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,291,392,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=6727/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,291,584,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=6728/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,291,776,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6729/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,291,968,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6730/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,292,160,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6731/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,292,352,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6732/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,292,544,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6733/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,292,736,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6734/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,292,928,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6735/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,293,120,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6736/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,293,312,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6737/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=1,293,504,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6738/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,293,696,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6739/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,293,888,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6740/500000]
+ optim/total_grad_norm=1.422
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,294,080,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6741/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=1,294,272,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6742/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,294,464,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6743/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,294,656,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6744/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,294,848,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6745/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=1,295,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6746/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,295,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6747/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,295,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6748/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,295,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6749/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,295,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6750/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,296,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6751/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,296,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6752/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,296,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6753/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,296,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6754/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,296,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6755/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,296,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6756/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,297,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6757/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,297,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6758/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,297,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6759/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=1,297,728,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6760/500000]
+ optim/total_grad_norm=1.208
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,297,920,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=6761/500000]
+ train/ActionNoiseL2Loss=0.1518
+ throughput/total_tokens=1,298,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6762/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,298,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6763/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,298,496,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6764/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,298,688,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6765/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=1,298,880,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6766/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,299,072,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6767/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,299,264,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6768/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,299,456,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6769/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,299,648,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6770/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,299,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6771/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,300,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6772/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,300,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6773/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,300,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6774/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,300,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6775/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,300,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6776/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,300,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6777/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,301,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6778/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,301,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6779/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,301,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6780/500000]
+ optim/total_grad_norm=1.353
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,301,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6781/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,301,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6782/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,302,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6783/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,302,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6784/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,302,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6785/500000]
+ train/ActionNoiseL2Loss=0.1026
+ throughput/total_tokens=1,302,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6786/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,302,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6787/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,303,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6788/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,303,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6789/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,303,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6790/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,303,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6791/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=1,303,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6792/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,304,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6793/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,304,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6794/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,304,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6795/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,304,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6796/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,304,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6797/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,305,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6798/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,305,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6799/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,305,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6800/500000]
+ optim/total_grad_norm=1.381
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,305,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6801/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,305,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6802/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,305,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6803/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,306,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6804/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,306,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6805/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,306,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6806/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,306,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6807/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,306,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6808/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,307,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6809/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=1,307,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6810/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,307,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=6811/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,307,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6812/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,307,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6813/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,308,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6814/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,308,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6815/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,308,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6816/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=1,308,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6817/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,308,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6818/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,309,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6819/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,309,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6820/500000]
+ optim/total_grad_norm=1.159
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,309,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6821/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=1,309,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6822/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,309,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6823/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,310,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6824/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,310,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6825/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,310,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6826/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,310,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6827/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,310,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6828/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,310,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6829/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,311,168,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6830/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,311,360,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6831/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=1,311,552,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6832/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,311,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6833/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,311,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6834/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,312,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6835/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,312,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6836/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,312,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6837/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,312,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6838/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,312,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6839/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,313,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6840/500000]
+ optim/total_grad_norm=1.330
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,313,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6841/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,313,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6842/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,313,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6843/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,313,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6844/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,314,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6845/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,314,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6846/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=1,314,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6847/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,314,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6848/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=1,314,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6849/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,315,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6850/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,315,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6851/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,315,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6852/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,315,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6853/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,315,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6854/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,315,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6855/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,316,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6856/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,316,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6857/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,316,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6858/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=1,316,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6859/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,316,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6860/500000]
+ optim/total_grad_norm=2.081
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,317,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=6861/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,317,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6862/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,317,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6863/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,317,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6864/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,317,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6865/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=1,318,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6866/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=1,318,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6867/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,318,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6868/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=1,318,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6869/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,318,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6870/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,319,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6871/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,319,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6872/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,319,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6873/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,319,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6874/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,319,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6875/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=1,320,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6876/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,320,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6877/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,320,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6878/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,320,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6879/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,320,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6880/500000]
+ optim/total_grad_norm=1.147
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,320,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6881/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,321,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6882/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,321,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6883/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,321,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6884/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,321,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6885/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,321,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6886/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=1,322,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6887/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,322,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6888/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,322,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6889/500000]
+ train/ActionNoiseL2Loss=0.0144
+ throughput/total_tokens=1,322,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6890/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,322,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6891/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,323,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6892/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,323,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6893/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,323,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6894/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,323,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6895/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,323,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6896/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,324,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=6897/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,324,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6898/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,324,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6899/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,324,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6900/500000]
+ optim/total_grad_norm=1.509
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,324,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=6901/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,324,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6902/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,325,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6903/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,325,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6904/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,325,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6905/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,325,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6906/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,325,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6907/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,326,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6908/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,326,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6909/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,326,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6910/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,326,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=6911/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,326,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6912/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,327,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6913/500000]
+ train/ActionNoiseL2Loss=0.0107
+ throughput/total_tokens=1,327,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6914/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,327,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6915/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,327,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6916/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,327,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6917/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,328,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6918/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,328,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6919/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,328,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6920/500000]
+ optim/total_grad_norm=1.323
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,328,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6921/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,328,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6922/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,329,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6923/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,329,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6924/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,329,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6925/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,329,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6926/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,329,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6927/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,329,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6928/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,330,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6929/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,330,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6930/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,330,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6931/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,330,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6932/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,330,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6933/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=1,331,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6934/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,331,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6935/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=1,331,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6936/500000]
+ train/ActionNoiseL2Loss=0.0133
+ throughput/total_tokens=1,331,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6937/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=1,331,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6938/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,332,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6939/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,332,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6940/500000]
+ optim/total_grad_norm=1.061
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,332,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6941/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,332,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6942/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,332,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6943/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,333,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6944/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,333,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6945/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,333,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6946/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,333,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6947/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,333,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6948/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,334,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6949/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,334,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=6950/500000]
+ train/ActionNoiseL2Loss=0.0127
+ throughput/total_tokens=1,334,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6951/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=1,334,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6952/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,334,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6953/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,334,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6954/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,335,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6955/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,335,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6956/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,335,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6957/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,335,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6958/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,335,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6959/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,336,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6960/500000]
+ optim/total_grad_norm=0.8903
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,336,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=6961/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,336,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6962/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,336,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6963/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,336,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6964/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=1,337,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6965/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,337,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6966/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,337,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6967/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,337,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6968/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,337,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6969/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,338,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6970/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,338,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6971/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,338,432,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6972/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=1,338,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6973/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,338,816,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=6974/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,339,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6975/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,339,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6976/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,339,392,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6977/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,339,584,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6978/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,339,776,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6979/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=1,339,968,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6980/500000]
+ optim/total_grad_norm=1.346
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,340,160,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6981/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,340,352,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6982/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,340,544,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6983/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,340,736,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6984/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,340,928,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6985/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,341,120,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6986/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,341,312,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6987/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,341,504,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6988/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,341,696,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6989/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,341,888,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6990/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,342,080,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=6991/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,342,272,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6992/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,342,464,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6993/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=1,342,656,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6994/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,342,848,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6995/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,343,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6996/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,343,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6997/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,343,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6998/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,343,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=6999/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=1,343,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7000/500000]
+ optim/total_grad_norm=1.031
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,344,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+10/04 [10:06:14] INFO | >> Saving config... checkpoint.py:608
+10/04 [10:07:06] INFO | >> Saving model state... checkpoint.py:796
+10/04 [10:08:18] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [10:09:49] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=7001/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=1,344,192,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7002/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,344,384,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=7003/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,344,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=7004/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,344,768,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7005/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,344,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7006/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,345,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7007/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,345,344,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=7008/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,345,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=7009/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,345,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=7010/500000]
+ train/ActionNoiseL2Loss=0.1020
+ throughput/total_tokens=1,345,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7011/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,346,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7012/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,346,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7013/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,346,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7014/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,346,688,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7015/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=1,346,880,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7016/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,347,072,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7017/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=1,347,264,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7018/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=1,347,456,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7019/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,347,648,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7020/500000]
+ optim/total_grad_norm=1.522
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,347,840,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7021/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,348,032,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7022/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,348,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7023/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=1,348,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7024/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,348,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7025/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,348,800,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7026/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,348,992,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7027/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,349,184,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7028/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,349,376,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7029/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,349,568,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7030/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,349,760,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7031/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,349,952,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7032/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,350,144,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7033/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,350,336,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7034/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,350,528,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7035/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,350,720,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7036/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,350,912,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7037/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,351,104,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7038/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,351,296,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7039/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=1,351,488,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7040/500000]
+ optim/total_grad_norm=0.5655
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,351,680,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7041/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,351,872,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7042/500000]
+ train/ActionNoiseL2Loss=0.1102
+ throughput/total_tokens=1,352,064,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7043/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,352,256,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7044/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,352,448,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7045/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,352,640,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7046/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,352,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7047/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,353,024,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7048/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,353,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7049/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,353,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7050/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,353,600,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7051/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,353,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7052/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=1,353,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7053/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,354,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7054/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,354,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7055/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,354,560,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7056/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=1,354,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7057/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,354,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7058/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,355,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7059/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,355,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7060/500000]
+ optim/total_grad_norm=0.7453
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,355,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=7061/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,355,712,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7062/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,355,904,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7063/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,356,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7064/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=1,356,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7065/500000]
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=1,356,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7066/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,356,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7067/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,356,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7068/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,357,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7069/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,357,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7070/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,357,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7071/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,357,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7072/500000]
+ train/ActionNoiseL2Loss=0.0142
+ throughput/total_tokens=1,357,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7073/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,358,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7074/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,358,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7075/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=1,358,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7076/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,358,592,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7077/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,358,784,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7078/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,358,976,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7079/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,359,168,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7080/500000]
+ optim/total_grad_norm=1.224
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,359,360,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7081/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=1,359,552,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7082/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,359,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7083/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=1,359,936,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7084/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,360,128,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7085/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,360,320,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7086/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,360,512,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7087/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,360,704,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7088/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,360,896,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7089/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,361,088,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7090/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,361,280,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7091/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,361,472,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7092/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,361,664,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7093/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,361,856,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7094/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,362,048,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7095/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,362,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7096/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,362,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7097/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,362,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7098/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=1,362,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7099/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,363,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7100/500000]
+ optim/total_grad_norm=1.133
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,363,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7101/500000]
+ train/ActionNoiseL2Loss=0.0121
+ throughput/total_tokens=1,363,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7102/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,363,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7103/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,363,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7104/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,363,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7105/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,364,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7106/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,364,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7107/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,364,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7108/500000]
+ train/ActionNoiseL2Loss=0.0126
+ throughput/total_tokens=1,364,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7109/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,364,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7110/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,365,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=7111/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,365,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7112/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,365,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7113/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,365,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7114/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,365,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7115/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,366,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7116/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,366,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7117/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,366,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7118/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,366,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7119/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,366,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7120/500000]
+ optim/total_grad_norm=1.788
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=1,367,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7121/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,367,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7122/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,367,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7123/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,367,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7124/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,367,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7125/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,368,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7126/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,368,192,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7127/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,368,384,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7128/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,368,576,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7129/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,368,768,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7130/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,368,960,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7131/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,369,152,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7132/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,369,344,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7133/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,369,536,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7134/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,369,728,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7135/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,369,920,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7136/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,370,112,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7137/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,370,304,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7138/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,370,496,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7139/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,370,688,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7140/500000]
+ optim/total_grad_norm=1.735
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,370,880,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7141/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,371,072,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7142/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,371,264,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7143/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,371,456,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7144/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,371,648,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7145/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,371,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7146/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,372,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7147/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,372,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7148/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,372,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7149/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,372,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7150/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,372,800,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7151/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,372,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7152/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,373,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7153/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,373,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7154/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,373,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7155/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,373,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7156/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,373,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7157/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,374,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7158/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,374,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7159/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,374,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7160/500000]
+ optim/total_grad_norm=1.134
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,374,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=7161/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,374,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7162/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,375,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7163/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,375,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7164/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,375,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7165/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,375,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7166/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,375,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7167/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,376,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7168/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,376,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7169/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,376,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7170/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,376,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7171/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,376,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7172/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,377,024,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7173/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,377,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7174/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,377,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7175/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=1,377,600,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7176/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,377,792,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7177/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,377,984,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7178/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,378,176,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7179/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,378,368,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7180/500000]
+ optim/total_grad_norm=1.160
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,378,560,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7181/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,378,752,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7182/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,378,944,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7183/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,379,136,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7184/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,379,328,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7185/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=1,379,520,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7186/500000]
+ train/ActionNoiseL2Loss=0.1194
+ throughput/total_tokens=1,379,712,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7187/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,379,904,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7188/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,380,096,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7189/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,380,288,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7190/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,380,480,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7191/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,380,672,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7192/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,380,864,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7193/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,381,056,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7194/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,381,248,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7195/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,381,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7196/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,381,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7197/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,381,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7198/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,382,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7199/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,382,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7200/500000]
+ optim/total_grad_norm=2.427
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=1,382,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7201/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=1,382,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7202/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,382,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7203/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,382,976,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7204/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,383,168,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7205/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,383,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7206/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,383,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7207/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,383,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7208/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,383,936,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7209/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,384,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7210/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,384,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=7211/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,384,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7212/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,384,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7213/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,384,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7214/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,385,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7215/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,385,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7216/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,385,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7217/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,385,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7218/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,385,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7219/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,386,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7220/500000]
+ optim/total_grad_norm=2.733
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,386,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7221/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,386,432,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7222/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,386,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7223/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,386,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7224/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,387,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7225/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,387,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7226/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,387,392,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7227/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,387,584,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7228/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,387,776,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7229/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,387,968,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7230/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,388,160,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7231/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,388,352,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7232/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,388,544,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7233/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,388,736,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7234/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,388,928,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7235/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,389,120,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7236/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,389,312,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7237/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,389,504,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7238/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,389,696,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7239/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,389,888,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7240/500000]
+ optim/total_grad_norm=1.470
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,390,080,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7241/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,390,272,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7242/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,390,464,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7243/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,390,656,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7244/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,390,848,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7245/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,391,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7246/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,391,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7247/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,391,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7248/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,391,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7249/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,391,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7250/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,392,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7251/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,392,192,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7252/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,392,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7253/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,392,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7254/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,392,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7255/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,392,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7256/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,393,152,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7257/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,393,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7258/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,393,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7259/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,393,728,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7260/500000]
+ optim/total_grad_norm=1.633
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,393,920,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=7261/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,394,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7262/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,394,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7263/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,394,496,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7264/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,394,688,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7265/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,394,880,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7266/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,395,072,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7267/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,395,264,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7268/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,395,456,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7269/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,395,648,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7270/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,395,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7271/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,396,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7272/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,396,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7273/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,396,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7274/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,396,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7275/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,396,800,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7276/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,396,992,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7277/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,397,184,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7278/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=1,397,376,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7279/500000]
+ train/ActionNoiseL2Loss=0.0147
+ throughput/total_tokens=1,397,568,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7280/500000]
+ optim/total_grad_norm=1.265
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,397,760,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7281/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=1,397,952,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7282/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,398,144,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7283/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,398,336,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7284/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,398,528,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7285/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,398,720,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7286/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,398,912,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7287/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=1,399,104,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7288/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=1,399,296,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7289/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,399,488,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7290/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,399,680,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7291/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,399,872,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7292/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=1,400,064,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7293/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,400,256,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7294/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,400,448,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7295/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,400,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7296/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,400,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7297/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,401,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7298/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,401,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7299/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,401,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7300/500000]
+ optim/total_grad_norm=0.9408
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,401,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7301/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,401,792,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7302/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,401,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7303/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,402,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7304/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=1,402,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7305/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,402,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7306/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,402,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7307/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,402,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7308/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,403,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7309/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=1,403,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7310/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,403,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=7311/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,403,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7312/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,403,904,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7313/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,404,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7314/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,404,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7315/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,404,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7316/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,404,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7317/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=1,404,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7318/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,405,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7319/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,405,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7320/500000]
+ optim/total_grad_norm=0.9189
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,405,440,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7321/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,405,632,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7322/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,405,824,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7323/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,406,016,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7324/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,406,208,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=7325/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,406,400,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7326/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=1,406,592,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7327/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,406,784,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7328/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,406,976,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7329/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,407,168,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7330/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,407,360,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7331/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,407,552,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7332/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,407,744,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7333/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,407,936,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7334/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,408,128,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7335/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,408,320,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7336/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,408,512,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7337/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,408,704,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7338/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,408,896,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7339/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,409,088,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7340/500000]
+ optim/total_grad_norm=1.574
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,409,280,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7341/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,409,472,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7342/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,409,664,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7343/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,409,856,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7344/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,410,048,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7345/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,410,240,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7346/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,410,432,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7347/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,410,624,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7348/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,410,816,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7349/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,411,008,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7350/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,411,200,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=7351/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,411,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7352/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,411,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7353/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,411,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7354/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,411,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7355/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,412,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7356/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,412,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7357/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=1,412,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7358/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,412,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7359/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,412,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7360/500000]
+ optim/total_grad_norm=0.8937
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,413,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=7361/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,413,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7362/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,413,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7363/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,413,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7364/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,413,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7365/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=1,414,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7366/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,414,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7367/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,414,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7368/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,414,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7369/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,414,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7370/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,415,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7371/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,415,232,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7372/500000]
+ train/ActionNoiseL2Loss=0.0105
+ throughput/total_tokens=1,415,424,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7373/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,415,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7374/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,415,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7375/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,416,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7376/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,416,192,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7377/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,416,384,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7378/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,416,576,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7379/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,416,768,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7380/500000]
+ optim/total_grad_norm=1.111
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,416,960,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7381/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,417,152,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7382/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,417,344,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7383/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,417,536,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7384/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,417,728,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7385/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=1,417,920,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7386/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,418,112,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7387/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,418,304,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7388/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,418,496,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7389/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,418,688,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7390/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,418,880,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7391/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,419,072,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7392/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,419,264,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7393/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,419,456,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=7394/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,419,648,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=7395/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,419,840,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=7396/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,420,032,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=7397/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,420,224,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=7398/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,420,416,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=7399/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,420,608,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=7400/500000]
+ optim/total_grad_norm=0.9984
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,420,800,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=7401/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,420,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7402/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,421,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7403/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,421,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7404/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=1,421,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7405/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,421,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7406/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,421,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7407/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,422,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7408/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,422,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7409/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,422,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7410/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,422,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=7411/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,422,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7412/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,423,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7413/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,423,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7414/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,423,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7415/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,423,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7416/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,423,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7417/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,424,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7418/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,424,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7419/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,424,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7420/500000]
+ optim/total_grad_norm=1.266
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,424,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7421/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,424,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7422/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,425,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7423/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,425,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7424/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,425,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7425/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,425,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7426/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,425,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7427/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,425,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7428/500000]
+ train/ActionNoiseL2Loss=0.0100
+ throughput/total_tokens=1,426,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7429/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,426,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7430/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,426,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7431/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,426,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7432/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=1,426,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7433/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,427,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7434/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,427,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7435/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,427,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7436/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,427,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7437/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=1,427,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7438/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,428,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7439/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,428,288,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7440/500000]
+ optim/total_grad_norm=0.8559
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,428,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7441/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,428,672,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7442/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=1,428,864,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7443/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,429,056,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7444/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=1,429,248,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7445/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,429,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7446/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,429,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7447/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,429,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7448/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=1,430,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7449/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,430,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7450/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,430,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7451/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,430,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7452/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,430,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7453/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,430,976,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7454/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,431,168,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7455/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,431,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7456/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,431,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7457/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,431,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7458/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,431,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7459/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,432,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7460/500000]
+ optim/total_grad_norm=1.736
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,432,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=7461/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=1,432,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7462/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,432,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7463/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,432,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7464/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,433,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7465/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,433,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7466/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,433,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7467/500000]
+ train/ActionNoiseL2Loss=0.0116
+ throughput/total_tokens=1,433,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7468/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,433,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7469/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,434,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7470/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,434,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7471/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,434,432,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7472/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,434,624,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7473/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,434,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7474/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,435,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7475/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=1,435,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7476/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,435,392,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7477/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,435,584,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7478/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,435,776,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7479/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,435,968,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7480/500000]
+ optim/total_grad_norm=1.413
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,436,160,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7481/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,436,352,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7482/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,436,544,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7483/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,436,736,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7484/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,436,928,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7485/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=1,437,120,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7486/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,437,312,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7487/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,437,504,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7488/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,437,696,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7489/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,437,888,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7490/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=1,438,080,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7491/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,438,272,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7492/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,438,464,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7493/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=1,438,656,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7494/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,438,848,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7495/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,439,040,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7496/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,439,232,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7497/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,439,424,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7498/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,439,616,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7499/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,439,808,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7500/500000]
+ optim/total_grad_norm=0.8145
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,440,000,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+10/04 [13:04:34] INFO | >> Saving config... checkpoint.py:608
+10/04 [13:05:20] INFO | >> Saving model state... checkpoint.py:796
+10/04 [13:06:32] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [13:08:03] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=7501/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,440,192,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7502/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,440,384,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=7503/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,440,576,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=7504/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,440,768,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=7505/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,440,960,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=7506/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,441,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=7507/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,441,344,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=7508/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,441,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=7509/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,441,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=7510/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,441,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=7511/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,442,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=7512/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,442,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=7513/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,442,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7514/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,442,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7515/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,442,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7516/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=1,443,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7517/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=1,443,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7518/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,443,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7519/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,443,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7520/500000]
+ optim/total_grad_norm=1.589
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,443,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7521/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,444,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7522/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=1,444,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7523/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,444,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7524/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,444,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7525/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,444,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7526/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,444,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7527/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,445,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7528/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,445,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7529/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,445,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7530/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,445,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7531/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,445,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7532/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,446,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7533/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,446,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7534/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=1,446,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7535/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,446,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7536/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=1,446,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7537/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,447,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7538/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,447,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7539/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,447,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7540/500000]
+ optim/total_grad_norm=0.7295
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,447,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7541/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,447,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7542/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,448,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7543/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,448,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7544/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,448,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7545/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,448,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7546/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,448,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7547/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,449,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7548/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,449,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7549/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=1,449,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7550/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,449,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7551/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,449,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7552/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,449,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7553/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,450,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7554/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=1,450,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7555/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,450,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7556/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,450,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7557/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,450,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7558/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,451,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7559/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,451,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7560/500000]
+ optim/total_grad_norm=1.510
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=1,451,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=7561/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,451,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7562/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,451,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7563/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,452,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7564/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,452,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7565/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,452,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7566/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,452,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7567/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,452,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7568/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,453,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7569/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,453,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7570/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,453,440,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7571/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,453,632,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7572/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=1,453,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7573/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,454,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7574/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,454,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7575/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,454,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7576/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,454,592,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7577/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,454,784,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7578/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=1,454,976,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7579/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,455,168,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7580/500000]
+ optim/total_grad_norm=0.8887
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=1,455,360,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7581/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,455,552,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7582/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,455,744,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7583/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,455,936,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7584/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,456,128,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7585/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,456,320,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7586/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,456,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7587/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,456,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7588/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,456,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7589/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,457,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7590/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,457,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7591/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=1,457,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7592/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,457,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7593/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,457,856,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7594/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,458,048,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7595/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,458,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7596/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=1,458,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7597/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,458,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7598/500000]
+ train/ActionNoiseL2Loss=0.0126
+ throughput/total_tokens=1,458,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7599/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,459,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7600/500000]
+ optim/total_grad_norm=1.202
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,459,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7601/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,459,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7602/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=1,459,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7603/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,459,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7604/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,459,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7605/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,460,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7606/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=1,460,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7607/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,460,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7608/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,460,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7609/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,460,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7610/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,461,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=7611/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=1,461,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7612/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,461,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7613/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=1,461,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7614/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,461,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7615/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,462,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7616/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,462,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7617/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,462,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7618/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,462,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7619/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=1,462,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7620/500000]
+ optim/total_grad_norm=1.306
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,463,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7621/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,463,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7622/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=1,463,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7623/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,463,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7624/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,463,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7625/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=1,464,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7626/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,464,192,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7627/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,464,384,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7628/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,464,576,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7629/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,464,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7630/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,464,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7631/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,465,152,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7632/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,465,344,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7633/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,465,536,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7634/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,465,728,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7635/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,465,920,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7636/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,466,112,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7637/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,466,304,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7638/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,466,496,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7639/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=1,466,688,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7640/500000]
+ optim/total_grad_norm=1.478
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,466,880,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7641/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,467,072,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7642/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,467,264,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7643/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,467,456,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7644/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,467,648,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7645/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,467,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7646/500000]
+ train/ActionNoiseL2Loss=0.0144
+ throughput/total_tokens=1,468,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7647/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=1,468,224,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7648/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,468,416,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7649/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=1,468,608,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7650/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=1,468,800,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7651/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,468,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7652/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,469,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7653/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,469,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7654/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,469,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7655/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,469,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7656/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,469,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7657/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,470,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7658/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,470,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7659/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,470,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7660/500000]
+ optim/total_grad_norm=0.7664
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,470,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=7661/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,470,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7662/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,471,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7663/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,471,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7664/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,471,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7665/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,471,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7666/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,471,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7667/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,472,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7668/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,472,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7669/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,472,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7670/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,472,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7671/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,472,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7672/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,473,024,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7673/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,473,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7674/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=1,473,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7675/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,473,600,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7676/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,473,792,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7677/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,473,984,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7678/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,474,176,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7679/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,474,368,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7680/500000]
+ optim/total_grad_norm=1.331
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,474,560,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7681/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,474,752,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7682/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,474,944,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7683/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,475,136,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7684/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,475,328,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7685/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=1,475,520,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7686/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,475,712,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7687/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,475,904,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7688/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,476,096,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7689/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,476,288,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7690/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,476,480,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7691/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,476,672,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7692/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,476,864,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7693/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,477,056,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7694/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,477,248,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7695/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,477,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7696/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,477,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7697/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,477,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7698/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,478,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7699/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,478,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7700/500000]
+ optim/total_grad_norm=1.682
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,478,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7701/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,478,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7702/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,478,784,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7703/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,478,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7704/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,479,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7705/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,479,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7706/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,479,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7707/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,479,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7708/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,479,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7709/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,480,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7710/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,480,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=7711/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=1,480,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7712/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,480,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7713/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,480,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7714/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,481,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7715/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=1,481,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7716/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,481,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7717/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,481,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7718/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,481,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7719/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=1,482,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7720/500000]
+ optim/total_grad_norm=1.151
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,482,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7721/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,482,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7722/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,482,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7723/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,482,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7724/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,483,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7725/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,483,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7726/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,483,392,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7727/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,483,584,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7728/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,483,776,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7729/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,483,968,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7730/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,484,160,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7731/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,484,352,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7732/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,484,544,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7733/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=1,484,736,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7734/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,484,928,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7735/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,485,120,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7736/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=1,485,312,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7737/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=1,485,504,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7738/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,485,696,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7739/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,485,888,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7740/500000]
+ optim/total_grad_norm=1.104
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,486,080,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7741/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,486,272,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7742/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,486,464,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7743/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,486,656,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7744/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,486,848,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7745/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,487,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7746/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=1,487,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7747/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=1,487,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7748/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,487,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7749/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,487,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7750/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,488,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7751/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,488,192,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7752/500000]
+ train/ActionNoiseL2Loss=0.0147
+ throughput/total_tokens=1,488,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7753/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,488,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7754/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,488,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7755/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,488,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7756/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,489,152,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7757/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,489,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7758/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,489,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7759/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,489,728,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7760/500000]
+ optim/total_grad_norm=0.6808
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=1,489,920,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=7761/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,490,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7762/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,490,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7763/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,490,496,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7764/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,490,688,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7765/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,490,880,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7766/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,491,072,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7767/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,491,264,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7768/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,491,456,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7769/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,491,648,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7770/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,491,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7771/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,492,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7772/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,492,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7773/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=1,492,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7774/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,492,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7775/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,492,800,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7776/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,492,992,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7777/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,493,184,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7778/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,493,376,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7779/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,493,568,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7780/500000]
+ optim/total_grad_norm=1.200
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,493,760,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7781/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,493,952,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7782/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=1,494,144,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7783/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=1,494,336,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7784/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,494,528,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7785/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,494,720,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7786/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,494,912,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7787/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=1,495,104,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7788/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,495,296,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7789/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=1,495,488,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7790/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,495,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7791/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,495,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7792/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,496,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7793/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,496,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7794/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,496,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7795/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,496,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7796/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,496,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7797/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,497,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7798/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,497,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7799/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,497,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7800/500000]
+ optim/total_grad_norm=1.081
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,497,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7801/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,497,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7802/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,497,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7803/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=1,498,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7804/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,498,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7805/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,498,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7806/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,498,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7807/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,498,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7808/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,499,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7809/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,499,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7810/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,499,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=7811/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,499,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7812/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,499,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7813/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,500,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7814/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,500,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7815/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,500,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7816/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,500,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7817/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,500,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7818/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,501,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7819/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,501,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7820/500000]
+ optim/total_grad_norm=0.7672
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,501,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7821/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=1,501,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7822/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,501,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7823/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,502,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7824/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,502,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7825/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,502,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7826/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,502,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7827/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,502,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7828/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,502,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7829/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=1,503,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7830/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,503,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7831/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,503,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7832/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,503,744,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7833/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,503,936,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7834/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,504,128,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7835/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,504,320,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7836/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,504,512,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7837/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,504,704,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7838/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,504,896,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7839/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,505,088,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7840/500000]
+ optim/total_grad_norm=0.6380
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,505,280,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7841/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,505,472,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7842/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,505,664,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7843/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,505,856,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7844/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,506,048,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7845/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=1,506,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7846/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,506,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7847/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,506,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7848/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,506,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7849/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=1,507,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7850/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,507,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7851/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,507,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7852/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,507,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7853/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=1,507,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7854/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,507,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7855/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,508,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7856/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,508,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7857/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,508,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7858/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,508,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7859/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,508,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7860/500000]
+ optim/total_grad_norm=1.680
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=1,509,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=7861/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,509,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7862/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,509,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7863/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,509,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7864/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,509,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7865/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,510,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7866/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,510,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7867/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,510,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7868/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,510,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7869/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,510,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7870/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,511,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7871/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=1,511,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7872/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,511,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7873/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,511,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7874/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,511,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7875/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,512,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7876/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,512,192,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7877/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,512,384,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7878/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,512,576,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7879/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,512,768,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7880/500000]
+ optim/total_grad_norm=0.8482
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=1,512,960,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7881/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,513,152,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7882/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,513,344,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7883/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,513,536,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7884/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,513,728,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7885/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,513,920,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7886/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,514,112,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7887/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,514,304,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7888/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,514,496,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7889/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=1,514,688,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7890/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,514,880,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7891/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,515,072,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7892/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,515,264,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7893/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,515,456,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7894/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,515,648,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7895/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,515,840,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7896/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=1,516,032,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7897/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,516,224,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7898/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,516,416,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7899/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,516,608,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7900/500000]
+ optim/total_grad_norm=1.279
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,516,800,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=7901/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,516,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7902/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,517,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7903/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=1,517,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7904/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,517,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7905/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,517,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7906/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,517,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7907/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,518,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7908/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,518,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7909/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,518,528,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7910/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,518,720,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=7911/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,518,912,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7912/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,519,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7913/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,519,296,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7914/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,519,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7915/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,519,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7916/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,519,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7917/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=1,520,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7918/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,520,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7919/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,520,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7920/500000]
+ optim/total_grad_norm=1.045
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,520,640,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=7921/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,520,832,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=7922/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,521,024,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=7923/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,521,216,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7924/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,521,408,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7925/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,521,600,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7926/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=1,521,792,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7927/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,521,984,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7928/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,522,176,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7929/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,522,368,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7930/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,522,560,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7931/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,522,752,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7932/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=1,522,944,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7933/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,523,136,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7934/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,523,328,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7935/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,523,520,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7936/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,523,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7937/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,523,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7938/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,524,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=7939/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,524,288,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7940/500000]
+ optim/total_grad_norm=1.114
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,524,480,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7941/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,524,672,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7942/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,524,864,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7943/500000]
+ train/ActionNoiseL2Loss=0.0137
+ throughput/total_tokens=1,525,056,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7944/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,525,248,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7945/500000]
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=1,525,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7946/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,525,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7947/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,525,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7948/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,526,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7949/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,526,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7950/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,526,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7951/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,526,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7952/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,526,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7953/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,526,976,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7954/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,527,168,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7955/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,527,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7956/500000]
+ train/ActionNoiseL2Loss=0.0143
+ throughput/total_tokens=1,527,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7957/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,527,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7958/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,527,936,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7959/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,528,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7960/500000]
+ optim/total_grad_norm=1.220
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,528,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=7961/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,528,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7962/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,528,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7963/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=1,528,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7964/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,529,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7965/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,529,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7966/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,529,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7967/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,529,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7968/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,529,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7969/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,530,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7970/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,530,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7971/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,530,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7972/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,530,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7973/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,530,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7974/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,531,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7975/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,531,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7976/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,531,392,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7977/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,531,584,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7978/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,531,776,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7979/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,531,968,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7980/500000]
+ optim/total_grad_norm=1.471
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,532,160,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7981/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,532,352,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7982/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,532,544,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7983/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,532,736,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7984/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,532,928,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=7985/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,533,120,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=7986/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,533,312,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=7987/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,533,504,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7988/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,533,696,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7989/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,533,888,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7990/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,534,080,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=7991/500000]
+ train/ActionNoiseL2Loss=0.0128
+ throughput/total_tokens=1,534,272,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=7992/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,534,464,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7993/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,534,656,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7994/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,534,848,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7995/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,535,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7996/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,535,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7997/500000]
+ train/ActionNoiseL2Loss=0.0124
+ throughput/total_tokens=1,535,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7998/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,535,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=7999/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,535,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8000/500000]
+ optim/total_grad_norm=1.064
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,536,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+10/04 [16:02:50] INFO | >> Saving config... checkpoint.py:608
+10/04 [16:03:36] INFO | >> Saving model state... checkpoint.py:796
+10/04 [16:04:48] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [16:06:19] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=8001/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,536,192,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8002/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,536,384,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=8003/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,536,576,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=8004/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,536,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8005/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,536,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=8006/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,537,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8007/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,537,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=8008/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,537,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8009/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,537,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8010/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=1,537,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8011/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=1,538,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8012/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,538,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8013/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,538,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8014/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,538,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8015/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,538,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8016/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,539,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8017/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,539,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8018/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,539,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8019/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,539,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8020/500000]
+ optim/total_grad_norm=2.465
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=1,539,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8021/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,540,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8022/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,540,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8023/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,540,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8024/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=1,540,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8025/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,540,800,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8026/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,540,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8027/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,541,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8028/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,541,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8029/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,541,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8030/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,541,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8031/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,541,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8032/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,542,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8033/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,542,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8034/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,542,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8035/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,542,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8036/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,542,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8037/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,543,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8038/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,543,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8039/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,543,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8040/500000]
+ optim/total_grad_norm=1.225
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,543,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8041/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,543,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8042/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,544,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8043/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,544,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8044/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,544,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8045/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,544,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8046/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=1,544,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8047/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,545,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8048/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,545,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8049/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,545,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8050/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,545,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8051/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,545,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8052/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,545,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8053/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,546,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8054/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,546,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8055/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,546,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8056/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,546,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8057/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,546,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8058/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,547,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8059/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,547,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8060/500000]
+ optim/total_grad_norm=1.727
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,547,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=8061/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,547,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8062/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,547,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8063/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,548,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8064/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,548,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8065/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,548,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8066/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,548,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8067/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,548,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8068/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,549,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8069/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,549,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8070/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,549,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8071/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,549,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8072/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,549,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8073/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=1,550,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8074/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,550,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8075/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,550,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8076/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,550,592,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8077/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,550,784,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8078/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=1,550,976,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8079/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,551,168,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8080/500000]
+ optim/total_grad_norm=1.297
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,551,360,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8081/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,551,552,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8082/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=1,551,744,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8083/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,551,936,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8084/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,552,128,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8085/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,552,320,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8086/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,552,512,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8087/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,552,704,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8088/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,552,896,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8089/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,553,088,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8090/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,553,280,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8091/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,553,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8092/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,553,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8093/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,553,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8094/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=1,554,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8095/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,554,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8096/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,554,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8097/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,554,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8098/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,554,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8099/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,555,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8100/500000]
+ optim/total_grad_norm=0.9016
+ train/ActionNoiseL2Loss=0.0133
+ throughput/total_tokens=1,555,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8101/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,555,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8102/500000]
+ train/ActionNoiseL2Loss=0.0095
+ throughput/total_tokens=1,555,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8103/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,555,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8104/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=1,555,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8105/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,556,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8106/500000]
+ train/ActionNoiseL2Loss=0.0110
+ throughput/total_tokens=1,556,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8107/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,556,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8108/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,556,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8109/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,556,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8110/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,557,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=8111/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,557,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8112/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,557,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8113/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,557,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8114/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=1,557,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8115/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,558,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8116/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=1,558,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8117/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,558,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8118/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,558,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8119/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,558,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8120/500000]
+ optim/total_grad_norm=0.7568
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,559,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8121/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=1,559,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8122/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,559,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8123/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,559,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8124/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,559,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8125/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=1,560,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8126/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,560,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8127/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,560,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8128/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,560,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8129/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,560,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8130/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,560,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8131/500000]
+ train/ActionNoiseL2Loss=0.0137
+ throughput/total_tokens=1,561,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8132/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=1,561,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8133/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,561,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8134/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,561,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8135/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,561,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8136/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=1,562,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8137/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,562,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8138/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,562,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8139/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,562,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8140/500000]
+ optim/total_grad_norm=0.7722
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,562,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8141/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,563,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8142/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,563,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8143/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,563,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8144/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,563,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8145/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,563,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8146/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,564,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8147/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,564,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8148/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,564,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8149/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,564,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8150/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,564,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8151/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,564,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8152/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,565,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8153/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,565,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8154/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,565,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8155/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,565,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8156/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,565,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8157/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,566,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8158/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,566,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8159/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,566,528,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8160/500000]
+ optim/total_grad_norm=1.465
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=1,566,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=8161/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,566,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8162/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,567,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8163/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,567,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8164/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,567,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8165/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,567,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8166/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,567,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8167/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,568,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8168/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,568,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8169/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,568,448,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8170/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,568,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8171/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,568,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8172/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,569,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8173/500000]
+ train/ActionNoiseL2Loss=0.1288
+ throughput/total_tokens=1,569,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8174/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,569,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8175/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,569,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8176/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,569,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8177/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,569,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8178/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,570,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8179/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,570,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8180/500000]
+ optim/total_grad_norm=1.507
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,570,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8181/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,570,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8182/500000]
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=1,570,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8183/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,571,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8184/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=1,571,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8185/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,571,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8186/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,571,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8187/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,571,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8188/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,572,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8189/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,572,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8190/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,572,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8191/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,572,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8192/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,572,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8193/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,573,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8194/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,573,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8195/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,573,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8196/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,573,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8197/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,573,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8198/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,574,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8199/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,574,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8200/500000]
+ optim/total_grad_norm=0.8295
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,574,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8201/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,574,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8202/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,574,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8203/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,574,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8204/500000]
+ train/ActionNoiseL2Loss=0.0130
+ throughput/total_tokens=1,575,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8205/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,575,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8206/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,575,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8207/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,575,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8208/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,575,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8209/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=1,576,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8210/500000]
+ train/ActionNoiseL2Loss=0.0138
+ throughput/total_tokens=1,576,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=8211/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,576,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8212/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,576,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8213/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,576,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8214/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,577,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8215/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,577,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8216/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,577,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8217/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,577,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8218/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,577,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8219/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,578,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8220/500000]
+ optim/total_grad_norm=0.7799
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,578,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8221/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,578,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8222/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,578,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8223/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,578,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8224/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=1,579,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8225/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,579,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8226/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,579,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8227/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,579,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8228/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,579,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8229/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,579,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8230/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,580,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8231/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,580,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8232/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,580,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8233/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,580,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8234/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,580,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8235/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,581,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8236/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,581,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8237/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=1,581,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8238/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,581,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8239/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,581,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8240/500000]
+ optim/total_grad_norm=1.195
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,582,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8241/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,582,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8242/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,582,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8243/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,582,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8244/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,582,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8245/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,583,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8246/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,583,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8247/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,583,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8248/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,583,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8249/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,583,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8250/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=1,584,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8251/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,584,192,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8252/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=1,584,384,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8253/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,584,576,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8254/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=1,584,768,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8255/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,584,960,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8256/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=1,585,152,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8257/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=1,585,344,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8258/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,585,536,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8259/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,585,728,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8260/500000]
+ optim/total_grad_norm=1.280
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,585,920,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=8261/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,586,112,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8262/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,586,304,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8263/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,586,496,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8264/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,586,688,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8265/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,586,880,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8266/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,587,072,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8267/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=1,587,264,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8268/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,587,456,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8269/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,587,648,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8270/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,587,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8271/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,588,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8272/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,588,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8273/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,588,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8274/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,588,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8275/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,588,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8276/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,588,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8277/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,589,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8278/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,589,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8279/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,589,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8280/500000]
+ optim/total_grad_norm=0.9150
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,589,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8281/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,589,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8282/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=1,590,144,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8283/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,590,336,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8284/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,590,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8285/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,590,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8286/500000]
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=1,590,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8287/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,591,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8288/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,591,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8289/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,591,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8290/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=1,591,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8291/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,591,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8292/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,592,064,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8293/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,592,256,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8294/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,592,448,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8295/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,592,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8296/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,592,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8297/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,593,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8298/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,593,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8299/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,593,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8300/500000]
+ optim/total_grad_norm=1.221
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,593,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8301/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,593,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8302/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,593,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8303/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,594,176,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8304/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,594,368,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8305/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,594,560,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8306/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,594,752,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8307/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,594,944,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8308/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,595,136,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8309/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,595,328,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8310/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,595,520,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=8311/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,595,712,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8312/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,595,904,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8313/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,596,096,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8314/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,596,288,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8315/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,596,480,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8316/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,596,672,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8317/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,596,864,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8318/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,597,056,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8319/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,597,248,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8320/500000]
+ optim/total_grad_norm=1.896
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,597,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8321/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,597,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8322/500000]
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=1,597,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8323/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,598,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8324/500000]
+ train/ActionNoiseL2Loss=0.0123
+ throughput/total_tokens=1,598,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8325/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,598,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8326/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,598,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8327/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,598,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8328/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,598,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8329/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,599,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8330/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,599,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8331/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,599,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8332/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,599,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8333/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,599,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8334/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,600,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8335/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,600,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8336/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,600,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8337/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,600,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8338/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=1,600,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8339/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,601,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8340/500000]
+ optim/total_grad_norm=1.096
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,601,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8341/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,601,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8342/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,601,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8343/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,601,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8344/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,602,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8345/500000]
+ train/ActionNoiseL2Loss=0.1012
+ throughput/total_tokens=1,602,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8346/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,602,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8347/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,602,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8348/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,602,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8349/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,603,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8350/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,603,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8351/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,603,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8352/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,603,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8353/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=1,603,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8354/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,603,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8355/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=1,604,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8356/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,604,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8357/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,604,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8358/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,604,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8359/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,604,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8360/500000]
+ optim/total_grad_norm=1.138
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=1,605,120,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=8361/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,605,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8362/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=1,605,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8363/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,605,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8364/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,605,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8365/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,606,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8366/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,606,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8367/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,606,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8368/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,606,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8369/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,606,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8370/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,607,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8371/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,607,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8372/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,607,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8373/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,607,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8374/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,607,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8375/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,608,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8376/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,608,192,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8377/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=1,608,384,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8378/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,608,576,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8379/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=1,608,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8380/500000]
+ optim/total_grad_norm=1.308
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,608,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8381/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,609,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8382/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,609,344,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8383/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,609,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8384/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,609,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8385/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,609,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8386/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,610,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8387/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,610,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8388/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,610,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8389/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,610,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8390/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=1,610,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8391/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,611,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8392/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,611,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8393/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,611,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8394/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,611,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8395/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,611,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8396/500000]
+ train/ActionNoiseL2Loss=0.0137
+ throughput/total_tokens=1,612,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8397/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=1,612,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8398/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,612,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8399/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,612,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8400/500000]
+ optim/total_grad_norm=1.803
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,612,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8401/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,612,992,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8402/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,613,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8403/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,613,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8404/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,613,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8405/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,613,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8406/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,613,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8407/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,614,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8408/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,614,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8409/500000]
+ train/ActionNoiseL2Loss=0.1379
+ throughput/total_tokens=1,614,528,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8410/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,614,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=8411/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=1,614,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8412/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,615,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8413/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,615,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8414/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,615,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8415/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,615,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8416/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,615,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8417/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,616,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8418/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,616,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8419/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,616,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8420/500000]
+ optim/total_grad_norm=1.020
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,616,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8421/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,616,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8422/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,617,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8423/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,617,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8424/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,617,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8425/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,617,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8426/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,617,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8427/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,617,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8428/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,618,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8429/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,618,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8430/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,618,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8431/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,618,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8432/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,618,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8433/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,619,136,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8434/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,619,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8435/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,619,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8436/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,619,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8437/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,619,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8438/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=1,620,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8439/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,620,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8440/500000]
+ optim/total_grad_norm=1.081
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,620,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8441/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,620,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8442/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=1,620,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8443/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,621,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8444/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,621,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8445/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,621,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8446/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,621,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8447/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,621,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8448/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,622,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8449/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,622,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8450/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,622,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8451/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,622,592,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8452/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,622,784,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8453/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,622,976,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8454/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=1,623,168,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8455/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,623,360,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8456/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,623,552,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8457/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,623,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8458/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,623,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8459/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=1,624,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8460/500000]
+ optim/total_grad_norm=1.144
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,624,320,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=8461/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,624,512,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8462/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,624,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8463/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,624,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8464/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,625,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8465/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,625,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8466/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,625,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8467/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,625,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8468/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,625,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8469/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=1,626,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8470/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,626,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8471/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,626,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8472/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,626,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8473/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,626,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8474/500000]
+ train/ActionNoiseL2Loss=0.0120
+ throughput/total_tokens=1,627,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8475/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,627,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8476/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,627,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8477/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,627,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8478/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,627,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8479/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,627,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8480/500000]
+ optim/total_grad_norm=1.041
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,628,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8481/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,628,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8482/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,628,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8483/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,628,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8484/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,628,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8485/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,629,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8486/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,629,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8487/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,629,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8488/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,629,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8489/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,629,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8490/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,630,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8491/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=1,630,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8492/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=1,630,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8493/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,630,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8494/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,630,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8495/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=1,631,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8496/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,631,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8497/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,631,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8498/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,631,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8499/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=1,631,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8500/500000]
+ optim/total_grad_norm=1.164
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,632,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+10/04 [19:01:09] INFO | >> Saving config... checkpoint.py:608
+10/04 [19:01:43] INFO | >> Saving model state... checkpoint.py:796
+10/04 [19:02:55] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [19:04:28] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=8501/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,632,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8502/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,632,384,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=8503/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,632,576,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=8504/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,632,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=8505/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,632,960,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8506/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,633,152,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8507/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,633,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=8508/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,633,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8509/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,633,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8510/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,633,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8511/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=1,634,112,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8512/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,634,304,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8513/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,634,496,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8514/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,634,688,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=8515/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=1,634,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8516/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,635,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8517/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,635,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8518/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,635,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8519/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,635,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8520/500000]
+ optim/total_grad_norm=1.100
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,635,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8521/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,636,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8522/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,636,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8523/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,636,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8524/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,636,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8525/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=1,636,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8526/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,636,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8527/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,637,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8528/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,637,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8529/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,637,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8530/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,637,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8531/500000]
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=1,637,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8532/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,638,144,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8533/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,638,336,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8534/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=1,638,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8535/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,638,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8536/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,638,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8537/500000]
+ train/ActionNoiseL2Loss=0.0120
+ throughput/total_tokens=1,639,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8538/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,639,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8539/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,639,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8540/500000]
+ optim/total_grad_norm=0.8592
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,639,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8541/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,639,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8542/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,640,064,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8543/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,640,256,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8544/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,640,448,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8545/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=1,640,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8546/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,640,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8547/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,641,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8548/500000]
+ train/ActionNoiseL2Loss=0.0137
+ throughput/total_tokens=1,641,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8549/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,641,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8550/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=1,641,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8551/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,641,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8552/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,641,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8553/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=1,642,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8554/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,642,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8555/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,642,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8556/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,642,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8557/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,642,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8558/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,643,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8559/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,643,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8560/500000]
+ optim/total_grad_norm=0.7947
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,643,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=8561/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,643,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8562/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,643,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8563/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,644,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8564/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,644,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8565/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,644,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8566/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,644,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8567/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,644,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8568/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,645,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8569/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,645,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8570/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,645,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8571/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,645,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8572/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=1,645,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8573/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,646,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8574/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,646,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8575/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,646,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8576/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,646,592,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8577/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,646,784,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8578/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,646,976,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8579/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,647,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8580/500000]
+ optim/total_grad_norm=0.8450
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,647,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8581/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,647,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8582/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,647,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8583/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,647,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8584/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,648,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8585/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,648,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8586/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,648,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8587/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,648,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8588/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,648,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8589/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,649,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8590/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=1,649,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8591/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,649,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8592/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,649,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8593/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,649,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8594/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,650,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8595/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,650,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8596/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,650,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8597/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,650,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8598/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=1,650,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8599/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,651,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8600/500000]
+ optim/total_grad_norm=2.113
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,651,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8601/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,651,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8602/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,651,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8603/500000]
+ train/ActionNoiseL2Loss=0.0147
+ throughput/total_tokens=1,651,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8604/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,651,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8605/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,652,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8606/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,652,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8607/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,652,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8608/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,652,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8609/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,652,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8610/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,653,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=8611/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,653,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8612/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,653,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8613/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,653,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8614/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,653,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8615/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=1,654,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8616/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,654,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8617/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,654,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8618/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=1,654,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8619/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,654,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8620/500000]
+ optim/total_grad_norm=1.259
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,655,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8621/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,655,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8622/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,655,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8623/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,655,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8624/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,655,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8625/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,656,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8626/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,656,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8627/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,656,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8628/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,656,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8629/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,656,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8630/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,656,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8631/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,657,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8632/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,657,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8633/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,657,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8634/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,657,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8635/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,657,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8636/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,658,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8637/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,658,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8638/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,658,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8639/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,658,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8640/500000]
+ optim/total_grad_norm=0.9382
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,658,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8641/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,659,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8642/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,659,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8643/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,659,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8644/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,659,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8645/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=1,659,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8646/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,660,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8647/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,660,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8648/500000]
+ train/ActionNoiseL2Loss=0.0138
+ throughput/total_tokens=1,660,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8649/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,660,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8650/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=1,660,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8651/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,660,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8652/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=1,661,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8653/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,661,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8654/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,661,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8655/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,661,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8656/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=1,661,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8657/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,662,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8658/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,662,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8659/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,662,528,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8660/500000]
+ optim/total_grad_norm=1.167
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,662,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=8661/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,662,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8662/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,663,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8663/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,663,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8664/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,663,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8665/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,663,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8666/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,663,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8667/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=1,664,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8668/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,664,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8669/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,664,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8670/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,664,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8671/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=1,664,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8672/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,665,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8673/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,665,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8674/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,665,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8675/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,665,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8676/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,665,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8677/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,665,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8678/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,666,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8679/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=1,666,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8680/500000]
+ optim/total_grad_norm=1.189
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,666,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8681/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,666,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8682/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=1,666,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8683/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,667,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8684/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,667,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8685/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,667,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8686/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,667,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8687/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,667,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8688/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,668,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8689/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,668,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8690/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,668,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8691/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,668,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8692/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,668,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8693/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,669,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8694/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,669,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8695/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,669,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8696/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=1,669,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8697/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,669,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8698/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=1,670,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8699/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=1,670,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8700/500000]
+ optim/total_grad_norm=1.865
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=1,670,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8701/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,670,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8702/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,670,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8703/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,670,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8704/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,671,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8705/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,671,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8706/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,671,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8707/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,671,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8708/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,671,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8709/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=1,672,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8710/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,672,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=8711/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=1,672,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8712/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,672,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8713/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,672,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8714/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,673,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8715/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,673,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8716/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,673,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8717/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,673,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8718/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,673,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8719/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=1,674,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8720/500000]
+ optim/total_grad_norm=1.254
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,674,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8721/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,674,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=8722/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,674,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8723/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,674,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8724/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,675,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8725/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,675,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8726/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,675,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8727/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,675,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8728/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,675,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8729/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=1,675,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8730/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=1,676,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8731/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,676,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8732/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,676,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8733/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,676,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8734/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,676,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8735/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,677,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8736/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,677,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8737/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,677,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8738/500000]
+ train/ActionNoiseL2Loss=0.0128
+ throughput/total_tokens=1,677,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8739/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,677,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8740/500000]
+ optim/total_grad_norm=1.462
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=1,678,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8741/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,678,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8742/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,678,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8743/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,678,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8744/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,678,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8745/500000]
+ train/ActionNoiseL2Loss=0.0092
+ throughput/total_tokens=1,679,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8746/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,679,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8747/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,679,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8748/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,679,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8749/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,679,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8750/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,680,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8751/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,680,192,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8752/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,680,384,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8753/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,680,576,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8754/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,680,768,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8755/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,680,960,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8756/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,681,152,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8757/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,681,344,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8758/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,681,536,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8759/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,681,728,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8760/500000]
+ optim/total_grad_norm=0.8301
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,681,920,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=8761/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,682,112,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8762/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,682,304,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8763/500000]
+ train/ActionNoiseL2Loss=0.0124
+ throughput/total_tokens=1,682,496,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8764/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,682,688,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8765/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,682,880,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8766/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,683,072,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8767/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,683,264,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8768/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,683,456,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8769/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,683,648,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8770/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=1,683,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8771/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,684,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8772/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=1,684,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8773/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,684,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8774/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,684,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8775/500000]
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=1,684,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8776/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,684,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8777/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,685,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8778/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,685,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8779/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,685,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8780/500000]
+ optim/total_grad_norm=0.8449
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,685,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8781/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,685,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8782/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,686,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8783/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,686,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8784/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,686,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8785/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,686,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8786/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,686,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8787/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,687,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8788/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,687,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8789/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,687,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8790/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,687,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8791/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,687,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8792/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,688,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8793/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,688,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8794/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,688,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8795/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,688,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8796/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=1,688,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8797/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,689,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8798/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,689,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8799/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,689,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8800/500000]
+ optim/total_grad_norm=1.267
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=1,689,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8801/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,689,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8802/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=1,689,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8803/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,690,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8804/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,690,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8805/500000]
+ train/ActionNoiseL2Loss=0.0123
+ throughput/total_tokens=1,690,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8806/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,690,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8807/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,690,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8808/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,691,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8809/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,691,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8810/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,691,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=8811/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,691,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8812/500000]
+ train/ActionNoiseL2Loss=0.0132
+ throughput/total_tokens=1,691,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8813/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,692,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8814/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=1,692,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8815/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,692,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8816/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,692,672,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8817/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,692,864,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8818/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,693,056,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8819/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,693,248,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8820/500000]
+ optim/total_grad_norm=1.430
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,693,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8821/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,693,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8822/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,693,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8823/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,694,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8824/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,694,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8825/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,694,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8826/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,694,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8827/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,694,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8828/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=1,694,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8829/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,695,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8830/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,695,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8831/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,695,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8832/500000]
+ train/ActionNoiseL2Loss=0.1080
+ throughput/total_tokens=1,695,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8833/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,695,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8834/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,696,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8835/500000]
+ train/ActionNoiseL2Loss=0.1301
+ throughput/total_tokens=1,696,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8836/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,696,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8837/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,696,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8838/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=1,696,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8839/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,697,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8840/500000]
+ optim/total_grad_norm=0.9043
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,697,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8841/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,697,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8842/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,697,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8843/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,697,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8844/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,698,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8845/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,698,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8846/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,698,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8847/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,698,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8848/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,698,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8849/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,699,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8850/500000]
+ train/ActionNoiseL2Loss=0.0118
+ throughput/total_tokens=1,699,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8851/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,699,392,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8852/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,699,584,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8853/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,699,776,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8854/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=1,699,968,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8855/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,700,160,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8856/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,700,352,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8857/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,700,544,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8858/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,700,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8859/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,700,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8860/500000]
+ optim/total_grad_norm=0.7246
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,701,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=8861/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=1,701,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8862/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,701,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8863/500000]
+ train/ActionNoiseL2Loss=0.0101
+ throughput/total_tokens=1,701,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8864/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,701,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8865/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,702,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8866/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=1,702,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8867/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,702,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8868/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,702,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8869/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,702,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8870/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,703,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8871/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=1,703,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8872/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,703,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8873/500000]
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=1,703,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8874/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,703,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8875/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,704,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8876/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,704,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8877/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,704,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8878/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=1,704,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8879/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,704,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8880/500000]
+ optim/total_grad_norm=1.522
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,704,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8881/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,705,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8882/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,705,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8883/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,705,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8884/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,705,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8885/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,705,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8886/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,706,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8887/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,706,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8888/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,706,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8889/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,706,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8890/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,706,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8891/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,707,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8892/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,707,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8893/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,707,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8894/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,707,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8895/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,707,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8896/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,708,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8897/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,708,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8898/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,708,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8899/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=1,708,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8900/500000]
+ optim/total_grad_norm=1.426
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,708,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8901/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,708,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8902/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,709,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8903/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,709,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8904/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=1,709,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8905/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,709,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8906/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,709,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8907/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,710,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8908/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,710,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8909/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,710,528,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8910/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,710,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=8911/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,710,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8912/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,711,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8913/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,711,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8914/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,711,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8915/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,711,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8916/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,711,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8917/500000]
+ train/ActionNoiseL2Loss=0.0144
+ throughput/total_tokens=1,712,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8918/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,712,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8919/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,712,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8920/500000]
+ optim/total_grad_norm=0.7451
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=1,712,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8921/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=1,712,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8922/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,713,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8923/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,713,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8924/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,713,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8925/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,713,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8926/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,713,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8927/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,713,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8928/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,714,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8929/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,714,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8930/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,714,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8931/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,714,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8932/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,714,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8933/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,715,136,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8934/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,715,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8935/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,715,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8936/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,715,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8937/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,715,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8938/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=1,716,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8939/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,716,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8940/500000]
+ optim/total_grad_norm=1.090
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=1,716,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8941/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,716,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8942/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,716,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8943/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=1,717,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8944/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,717,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8945/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,717,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8946/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,717,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8947/500000]
+ train/ActionNoiseL2Loss=0.0140
+ throughput/total_tokens=1,717,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8948/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,718,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8949/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,718,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8950/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,718,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8951/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=1,718,592,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8952/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,718,784,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8953/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,718,976,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8954/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,719,168,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8955/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,719,360,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8956/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,719,552,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8957/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,719,744,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8958/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,719,936,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8959/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,720,128,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8960/500000]
+ optim/total_grad_norm=1.042
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,720,320,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+ System/Peak GPU Memory (MB)=46,467
+[step=8961/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=1,720,512,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=8962/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,720,704,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8963/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=1,720,896,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8964/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,721,088,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8965/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,721,280,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8966/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,721,472,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=8967/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,721,664,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8968/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,721,856,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8969/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,722,048,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=8970/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,722,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=8971/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,722,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8972/500000]
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=1,722,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8973/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,722,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8974/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,723,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8975/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,723,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8976/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,723,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8977/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,723,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8978/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,723,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8979/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,723,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8980/500000]
+ optim/total_grad_norm=1.198
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,724,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8981/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,724,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8982/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,724,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8983/500000]
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=1,724,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8984/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,724,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8985/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,725,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8986/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,725,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8987/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,725,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8988/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=1,725,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8989/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=1,725,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8990/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,726,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=8991/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,726,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8992/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,726,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8993/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=1,726,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8994/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=1,726,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8995/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,727,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8996/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,727,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8997/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,727,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8998/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=1,727,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=8999/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,727,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9000/500000]
+ optim/total_grad_norm=1.064
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,728,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+10/04 [21:58:59] INFO | >> Saving config... checkpoint.py:608
+10/04 [21:59:50] INFO | >> Saving model state... checkpoint.py:796
+10/04 [22:01:01] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [22:02:33] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=9001/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,728,192,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=9002/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=1,728,384,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=9003/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,728,576,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9004/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,728,768,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9005/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,728,960,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=9006/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,729,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9007/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,729,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9008/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,729,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9009/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,729,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9010/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,729,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9011/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=1,730,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9012/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,730,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9013/500000]
+ train/ActionNoiseL2Loss=0.0140
+ throughput/total_tokens=1,730,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9014/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,730,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9015/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,730,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9016/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,731,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9017/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,731,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9018/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,731,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9019/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,731,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9020/500000]
+ optim/total_grad_norm=1.235
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,731,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9021/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,732,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9022/500000]
+ train/ActionNoiseL2Loss=0.0108
+ throughput/total_tokens=1,732,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9023/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=1,732,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9024/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,732,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9025/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=1,732,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9026/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,732,992,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9027/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=1,733,184,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9028/500000]
+ train/ActionNoiseL2Loss=0.0144
+ throughput/total_tokens=1,733,376,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9029/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,733,568,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9030/500000]
+ train/ActionNoiseL2Loss=0.0147
+ throughput/total_tokens=1,733,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9031/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,733,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9032/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,734,144,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9033/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,734,336,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9034/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,734,528,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9035/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=1,734,720,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9036/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=1,734,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9037/500000]
+ train/ActionNoiseL2Loss=0.0090
+ throughput/total_tokens=1,735,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9038/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,735,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9039/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,735,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9040/500000]
+ optim/total_grad_norm=0.4973
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,735,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9041/500000]
+ train/ActionNoiseL2Loss=0.0133
+ throughput/total_tokens=1,735,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9042/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,736,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9043/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,736,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9044/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,736,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9045/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,736,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9046/500000]
+ train/ActionNoiseL2Loss=0.0118
+ throughput/total_tokens=1,736,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9047/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,737,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9048/500000]
+ train/ActionNoiseL2Loss=0.0107
+ throughput/total_tokens=1,737,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9049/500000]
+ train/ActionNoiseL2Loss=0.0106
+ throughput/total_tokens=1,737,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9050/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,737,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9051/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=1,737,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9052/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,737,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9053/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,738,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9054/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,738,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9055/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,738,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9056/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,738,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9057/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,738,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9058/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,739,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9059/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,739,328,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9060/500000]
+ optim/total_grad_norm=1.289
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,739,520,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=9061/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,739,712,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9062/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,739,904,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9063/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,740,096,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9064/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,740,288,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9065/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,740,480,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9066/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,740,672,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9067/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,740,864,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=9068/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,741,056,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=9069/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,741,248,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=9070/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,741,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9071/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,741,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9072/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,741,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9073/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,742,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9074/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,742,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9075/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,742,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9076/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,742,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9077/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,742,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9078/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,742,976,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9079/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,743,168,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9080/500000]
+ optim/total_grad_norm=0.7879
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,743,360,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9081/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,743,552,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9082/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,743,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9083/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,743,936,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9084/500000]
+ train/ActionNoiseL2Loss=0.0124
+ throughput/total_tokens=1,744,128,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9085/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,744,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9086/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,744,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9087/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=1,744,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9088/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,744,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9089/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,745,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9090/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,745,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9091/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,745,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9092/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,745,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9093/500000]
+ train/ActionNoiseL2Loss=0.0123
+ throughput/total_tokens=1,745,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9094/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,746,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9095/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,746,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9096/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=1,746,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9097/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,746,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9098/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,746,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9099/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,747,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9100/500000]
+ optim/total_grad_norm=0.7902
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=1,747,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9101/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,747,392,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=9102/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,747,584,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=9103/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,747,776,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=9104/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,747,968,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=9105/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,748,160,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=9106/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,748,352,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=9107/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,748,544,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=9108/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,748,736,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=9109/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,748,928,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=9110/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,749,120,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9111/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,749,312,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=9112/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,749,504,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=9113/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,749,696,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=9114/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,749,888,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9115/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,750,080,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9116/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,750,272,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9117/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,750,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9118/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=1,750,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9119/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,750,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9120/500000]
+ optim/total_grad_norm=1.059
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,751,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9121/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=1,751,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9122/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,751,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9123/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,751,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9124/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,751,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9125/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,752,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9126/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,752,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9127/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,752,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9128/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,752,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9129/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,752,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9130/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,752,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9131/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,753,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9132/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,753,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9133/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,753,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9134/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,753,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9135/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,753,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9136/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,754,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9137/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,754,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9138/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,754,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9139/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,754,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9140/500000]
+ optim/total_grad_norm=1.185
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,754,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9141/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,755,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9142/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,755,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9143/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,755,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9144/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,755,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9145/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,755,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9146/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,756,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9147/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,756,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9148/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,756,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9149/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,756,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9150/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,756,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9151/500000]
+ train/ActionNoiseL2Loss=0.0085
+ throughput/total_tokens=1,756,992,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9152/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,757,184,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9153/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,757,376,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9154/500000]
+ train/ActionNoiseL2Loss=0.0133
+ throughput/total_tokens=1,757,568,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9155/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,757,760,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9156/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,757,952,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9157/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,758,144,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=9158/500000]
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=1,758,336,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9159/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,758,528,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9160/500000]
+ optim/total_grad_norm=1.505
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,758,720,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=9161/500000]
+ train/ActionNoiseL2Loss=0.0119
+ throughput/total_tokens=1,758,912,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9162/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=1,759,104,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9163/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,759,296,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9164/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,759,488,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9165/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,759,680,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9166/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=1,759,872,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9167/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,760,064,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9168/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,760,256,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9169/500000]
+ train/ActionNoiseL2Loss=0.0129
+ throughput/total_tokens=1,760,448,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9170/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,760,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9171/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,760,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9172/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=1,761,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9173/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,761,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9174/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,761,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9175/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,761,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9176/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,761,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9177/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,761,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9178/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,762,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9179/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,762,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9180/500000]
+ optim/total_grad_norm=0.9198
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,762,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9181/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,762,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9182/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,762,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9183/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,763,136,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9184/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,763,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9185/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,763,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9186/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,763,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9187/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,763,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9188/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,764,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9189/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,764,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9190/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,764,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9191/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,764,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9192/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,764,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9193/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,765,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9194/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=1,765,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9195/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,765,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9196/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=1,765,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9197/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,765,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9198/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,766,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9199/500000]
+ train/ActionNoiseL2Loss=0.0102
+ throughput/total_tokens=1,766,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9200/500000]
+ optim/total_grad_norm=1.218
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,766,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9201/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,766,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9202/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,766,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9203/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,766,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9204/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,767,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9205/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,767,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9206/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,767,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9207/500000]
+ train/ActionNoiseL2Loss=0.0125
+ throughput/total_tokens=1,767,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9208/500000]
+ train/ActionNoiseL2Loss=0.0123
+ throughput/total_tokens=1,767,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9209/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,768,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9210/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,768,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=9211/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,768,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9212/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,768,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9213/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=1,768,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9214/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=1,769,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9215/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,769,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9216/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,769,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9217/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=1,769,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9218/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,769,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9219/500000]
+ train/ActionNoiseL2Loss=0.0143
+ throughput/total_tokens=1,770,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9220/500000]
+ optim/total_grad_norm=0.7004
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,770,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9221/500000]
+ train/ActionNoiseL2Loss=0.0140
+ throughput/total_tokens=1,770,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9222/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,770,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9223/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,770,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9224/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=1,771,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9225/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,771,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9226/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,771,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9227/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,771,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9228/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,771,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9229/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,771,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9230/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,772,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9231/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=1,772,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9232/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=1,772,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9233/500000]
+ train/ActionNoiseL2Loss=0.0128
+ throughput/total_tokens=1,772,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9234/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,772,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9235/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,773,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9236/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,773,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9237/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,773,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9238/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,773,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9239/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,773,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9240/500000]
+ optim/total_grad_norm=1.566
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,774,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9241/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,774,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9242/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,774,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9243/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,774,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9244/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,774,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9245/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,775,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9246/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,775,232,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9247/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,775,424,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9248/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=1,775,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9249/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,775,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9250/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=1,776,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9251/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,776,192,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9252/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,776,384,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9253/500000]
+ train/ActionNoiseL2Loss=0.0128
+ throughput/total_tokens=1,776,576,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9254/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,776,768,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9255/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,776,960,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9256/500000]
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=1,777,152,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9257/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,777,344,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9258/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,777,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9259/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,777,728,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9260/500000]
+ optim/total_grad_norm=1.186
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,777,920,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=9261/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,778,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9262/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,778,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9263/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,778,496,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9264/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,778,688,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9265/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,778,880,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9266/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,779,072,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9267/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,779,264,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9268/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,779,456,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9269/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,779,648,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9270/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,779,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9271/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=1,780,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9272/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,780,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9273/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,780,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9274/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,780,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9275/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=1,780,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9276/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,780,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9277/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,781,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9278/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,781,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9279/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,781,568,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9280/500000]
+ optim/total_grad_norm=0.8708
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,781,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9281/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,781,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9282/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,782,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9283/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,782,336,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9284/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,782,528,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9285/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,782,720,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9286/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,782,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9287/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,783,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9288/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,783,296,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9289/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,783,488,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9290/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,783,680,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9291/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,783,872,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9292/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,784,064,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9293/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,784,256,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9294/500000]
+ train/ActionNoiseL2Loss=0.0138
+ throughput/total_tokens=1,784,448,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9295/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,784,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9296/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,784,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9297/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,785,024,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9298/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,785,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9299/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,785,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9300/500000]
+ optim/total_grad_norm=1.323
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,785,600,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9301/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=1,785,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9302/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,785,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9303/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,786,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9304/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,786,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9305/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,786,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9306/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,786,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9307/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,786,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9308/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,787,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9309/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,787,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9310/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,787,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=9311/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,787,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9312/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,787,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9313/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,788,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9314/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,788,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9315/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,788,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9316/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,788,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9317/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,788,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9318/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,789,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9319/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,789,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9320/500000]
+ optim/total_grad_norm=1.269
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,789,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9321/500000]
+ train/ActionNoiseL2Loss=0.0097
+ throughput/total_tokens=1,789,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9322/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,789,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9323/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,790,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9324/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,790,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9325/500000]
+ train/ActionNoiseL2Loss=0.0093
+ throughput/total_tokens=1,790,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9326/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,790,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9327/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,790,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9328/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,790,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9329/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,791,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9330/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,791,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9331/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,791,552,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9332/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,791,744,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9333/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,791,936,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9334/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,792,128,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9335/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,792,320,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9336/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,792,512,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9337/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,792,704,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9338/500000]
+ train/ActionNoiseL2Loss=0.0147
+ throughput/total_tokens=1,792,896,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9339/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,793,088,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9340/500000]
+ optim/total_grad_norm=2.039
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,793,280,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9341/500000]
+ train/ActionNoiseL2Loss=0.0133
+ throughput/total_tokens=1,793,472,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9342/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,793,664,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9343/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,793,856,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9344/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=1,794,048,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9345/500000]
+ train/ActionNoiseL2Loss=0.0111
+ throughput/total_tokens=1,794,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9346/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,794,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9347/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,794,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9348/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,794,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9349/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,795,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9350/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,795,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9351/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,795,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9352/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,795,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9353/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,795,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9354/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,795,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9355/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,796,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9356/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,796,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9357/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=1,796,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9358/500000]
+ train/ActionNoiseL2Loss=0.0102
+ throughput/total_tokens=1,796,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9359/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=1,796,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9360/500000]
+ optim/total_grad_norm=1.418
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,797,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=9361/500000]
+ train/ActionNoiseL2Loss=0.0110
+ throughput/total_tokens=1,797,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9362/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=1,797,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9363/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,797,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9364/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,797,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9365/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,798,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9366/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,798,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9367/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=1,798,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9368/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,798,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9369/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,798,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9370/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,799,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9371/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=1,799,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9372/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,799,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9373/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,799,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9374/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,799,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9375/500000]
+ train/ActionNoiseL2Loss=0.0129
+ throughput/total_tokens=1,800,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9376/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,800,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9377/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,800,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9378/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=1,800,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9379/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,800,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9380/500000]
+ optim/total_grad_norm=1.378
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,800,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9381/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,801,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9382/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,801,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9383/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,801,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9384/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,801,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9385/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,801,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9386/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,802,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9387/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,802,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9388/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,802,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9389/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,802,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9390/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,802,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9391/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,803,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9392/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,803,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9393/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,803,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9394/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,803,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9395/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,803,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9396/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,804,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9397/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,804,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9398/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,804,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9399/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,804,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9400/500000]
+ optim/total_grad_norm=0.7781
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=1,804,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9401/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,804,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9402/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,805,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9403/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,805,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9404/500000]
+ train/ActionNoiseL2Loss=0.0124
+ throughput/total_tokens=1,805,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9405/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,805,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9406/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,805,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9407/500000]
+ train/ActionNoiseL2Loss=0.0117
+ throughput/total_tokens=1,806,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9408/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,806,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9409/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,806,528,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9410/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,806,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=9411/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,806,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9412/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,807,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9413/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,807,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9414/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,807,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9415/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=1,807,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9416/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,807,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9417/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,808,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9418/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,808,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9419/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=1,808,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9420/500000]
+ optim/total_grad_norm=0.9179
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=1,808,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9421/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,808,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9422/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,809,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9423/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,809,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9424/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,809,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9425/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,809,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9426/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,809,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9427/500000]
+ train/ActionNoiseL2Loss=0.0138
+ throughput/total_tokens=1,809,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9428/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,810,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9429/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,810,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9430/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,810,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9431/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,810,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9432/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,810,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9433/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,811,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9434/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,811,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9435/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=1,811,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9436/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,811,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9437/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=1,811,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9438/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,812,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9439/500000]
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=1,812,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9440/500000]
+ optim/total_grad_norm=0.7481
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,812,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9441/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,812,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9442/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=1,812,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9443/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,813,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9444/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,813,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9445/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,813,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9446/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,813,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9447/500000]
+ train/ActionNoiseL2Loss=0.0123
+ throughput/total_tokens=1,813,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9448/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,814,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9449/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=1,814,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9450/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,814,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9451/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,814,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9452/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,814,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9453/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,814,976,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9454/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,815,168,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9455/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,815,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9456/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,815,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9457/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,815,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9458/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,815,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9459/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=1,816,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9460/500000]
+ optim/total_grad_norm=1.413
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,816,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=9461/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,816,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9462/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,816,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9463/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,816,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9464/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,817,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9465/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,817,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9466/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=1,817,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9467/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,817,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9468/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,817,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9469/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,818,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9470/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,818,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9471/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,818,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9472/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,818,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9473/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,818,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9474/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,819,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9475/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,819,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9476/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,819,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9477/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,819,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9478/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,819,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9479/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=1,819,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9480/500000]
+ optim/total_grad_norm=1.203
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,820,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9481/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,820,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9482/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,820,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9483/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,820,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9484/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,820,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9485/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=1,821,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9486/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,821,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9487/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,821,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9488/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,821,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9489/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,821,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9490/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,822,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9491/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,822,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9492/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,822,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9493/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,822,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9494/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,822,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9495/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,823,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9496/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,823,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9497/500000]
+ train/ActionNoiseL2Loss=0.0115
+ throughput/total_tokens=1,823,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9498/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,823,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9499/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,823,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9500/500000]
+ optim/total_grad_norm=1.431
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,824,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+10/05 [00:56:53] INFO | >> Saving config... checkpoint.py:608
+10/05 [00:57:54] INFO | >> Saving model state... checkpoint.py:796
+10/05 [00:59:06] INFO | >> Saving optim state... checkpoint.py:811
+10/05 [01:00:37] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=9501/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,824,192,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=9502/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=1,824,384,000
+ throughput/device/tokens_per_second=1,171
+ throughput/device/batches_per_second=0.0488
+[step=9503/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,824,576,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=9504/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,824,768,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=9505/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=1,824,960,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=9506/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,825,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9507/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,825,344,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=9508/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,825,536,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=9509/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=1,825,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9510/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=1,825,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9511/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,826,112,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=9512/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,826,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9513/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,826,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9514/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,826,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9515/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,826,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9516/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,827,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9517/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,827,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9518/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,827,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9519/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,827,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9520/500000]
+ optim/total_grad_norm=1.506
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,827,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9521/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,828,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9522/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,828,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9523/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=1,828,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9524/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,828,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9525/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,828,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9526/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,828,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9527/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,829,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9528/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,829,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9529/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=1,829,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9530/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=1,829,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9531/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,829,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9532/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,830,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9533/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,830,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9534/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,830,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9535/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,830,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9536/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=1,830,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9537/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,831,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9538/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,831,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9539/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,831,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9540/500000]
+ optim/total_grad_norm=0.8179
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,831,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9541/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,831,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9542/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,832,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9543/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,832,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9544/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,832,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9545/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,832,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9546/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,832,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9547/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,833,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9548/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,833,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9549/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,833,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9550/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,833,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9551/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,833,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9552/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,833,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9553/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,834,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9554/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,834,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9555/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,834,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9556/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,834,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9557/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,834,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9558/500000]
+ train/ActionNoiseL2Loss=0.0144
+ throughput/total_tokens=1,835,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9559/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,835,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9560/500000]
+ optim/total_grad_norm=1.345
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,835,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=9561/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,835,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9562/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,835,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9563/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,836,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9564/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,836,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9565/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,836,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9566/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,836,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9567/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,836,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9568/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,837,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9569/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,837,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9570/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,837,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9571/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,837,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9572/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,837,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9573/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,838,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9574/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,838,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9575/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,838,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9576/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,838,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9577/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,838,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9578/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,838,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9579/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,839,168,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9580/500000]
+ optim/total_grad_norm=0.8023
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,839,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9581/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,839,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9582/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,839,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9583/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=1,839,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9584/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,840,128,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9585/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,840,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9586/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,840,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9587/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,840,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9588/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,840,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9589/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,841,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9590/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,841,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9591/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,841,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9592/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,841,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9593/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,841,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9594/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,842,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9595/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,842,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9596/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,842,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9597/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,842,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9598/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,842,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9599/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,843,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9600/500000]
+ optim/total_grad_norm=1.174
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,843,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9601/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=1,843,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9602/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,843,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9603/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,843,776,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9604/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,843,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9605/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,844,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9606/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=1,844,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9607/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,844,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9608/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,844,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9609/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=1,844,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9610/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,845,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=9611/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,845,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9612/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=1,845,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9613/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,845,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9614/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,845,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9615/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,846,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9616/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,846,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9617/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,846,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9618/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,846,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9619/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=1,846,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9620/500000]
+ optim/total_grad_norm=0.7751
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=1,847,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9621/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,847,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9622/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,847,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9623/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,847,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9624/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,847,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9625/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,848,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9626/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,848,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9627/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,848,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9628/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,848,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9629/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=1,848,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9630/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=1,848,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9631/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,849,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9632/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,849,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9633/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,849,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9634/500000]
+ train/ActionNoiseL2Loss=0.0129
+ throughput/total_tokens=1,849,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9635/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,849,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9636/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,850,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9637/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,850,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9638/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,850,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9639/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,850,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9640/500000]
+ optim/total_grad_norm=1.431
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,850,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9641/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,851,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9642/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=1,851,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9643/500000]
+ train/ActionNoiseL2Loss=0.0119
+ throughput/total_tokens=1,851,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9644/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,851,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9645/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,851,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9646/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=1,852,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9647/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,852,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9648/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,852,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9649/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,852,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9650/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,852,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9651/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=1,852,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9652/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,853,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9653/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,853,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9654/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,853,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9655/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,853,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9656/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,853,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9657/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,854,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9658/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,854,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9659/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,854,528,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9660/500000]
+ optim/total_grad_norm=1.211
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,854,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=9661/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=1,854,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9662/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,855,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9663/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,855,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9664/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,855,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9665/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,855,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9666/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=1,855,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9667/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,856,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9668/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,856,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9669/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,856,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9670/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,856,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9671/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,856,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9672/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=1,857,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9673/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,857,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9674/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,857,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9675/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=1,857,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9676/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,857,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9677/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,857,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9678/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,858,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9679/500000]
+ train/ActionNoiseL2Loss=0.0100
+ throughput/total_tokens=1,858,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9680/500000]
+ optim/total_grad_norm=1.019
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,858,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9681/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,858,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9682/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,858,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9683/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,859,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9684/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,859,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9685/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,859,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9686/500000]
+ train/ActionNoiseL2Loss=0.0102
+ throughput/total_tokens=1,859,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9687/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=1,859,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9688/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,860,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9689/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,860,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9690/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,860,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9691/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,860,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9692/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,860,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9693/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,861,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9694/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,861,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9695/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,861,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9696/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=1,861,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9697/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,861,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9698/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,862,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9699/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,862,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9700/500000]
+ optim/total_grad_norm=2.675
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,862,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9701/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,862,592,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9702/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,862,784,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9703/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,862,976,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9704/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,863,168,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9705/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,863,360,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9706/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,863,552,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9707/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,863,744,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9708/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,863,936,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9709/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,864,128,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9710/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=1,864,320,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=9711/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,864,512,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9712/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=1,864,704,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9713/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,864,896,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9714/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,865,088,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9715/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=1,865,280,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9716/500000]
+ train/ActionNoiseL2Loss=0.0099
+ throughput/total_tokens=1,865,472,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9717/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,865,664,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9718/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=1,865,856,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9719/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,866,048,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9720/500000]
+ optim/total_grad_norm=1.082
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,866,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9721/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,866,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9722/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,866,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9723/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,866,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9724/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,867,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9725/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,867,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9726/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,867,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9727/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,867,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9728/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,867,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9729/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,867,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9730/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,868,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9731/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,868,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9732/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,868,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9733/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,868,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9734/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,868,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9735/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,869,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9736/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,869,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9737/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=1,869,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9738/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,869,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9739/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,869,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9740/500000]
+ optim/total_grad_norm=0.6499
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=1,870,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9741/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,870,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9742/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,870,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9743/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,870,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9744/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,870,848,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9745/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,871,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9746/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,871,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9747/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=1,871,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9748/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,871,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9749/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,871,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9750/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,872,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9751/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,872,192,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9752/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=1,872,384,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9753/500000]
+ train/ActionNoiseL2Loss=0.1382
+ throughput/total_tokens=1,872,576,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9754/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,872,768,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9755/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,872,960,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9756/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=1,873,152,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9757/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,873,344,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9758/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,873,536,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9759/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,873,728,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9760/500000]
+ optim/total_grad_norm=1.268
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,873,920,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=9761/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,874,112,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9762/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,874,304,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9763/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,874,496,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9764/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,874,688,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9765/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,874,880,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9766/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,875,072,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9767/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,875,264,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9768/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,875,456,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9769/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=1,875,648,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9770/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,875,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9771/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=1,876,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9772/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=1,876,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9773/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,876,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9774/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,876,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9775/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,876,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9776/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=1,876,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9777/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,877,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9778/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,877,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9779/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,877,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9780/500000]
+ optim/total_grad_norm=1.017
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,877,760,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9781/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=1,877,952,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9782/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=1,878,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9783/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,878,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9784/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=1,878,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9785/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,878,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9786/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,878,912,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9787/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,879,104,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9788/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,879,296,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9789/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,879,488,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9790/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=1,879,680,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9791/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,879,872,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9792/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,880,064,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9793/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,880,256,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9794/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,880,448,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9795/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,880,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9796/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,880,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9797/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,881,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9798/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,881,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9799/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,881,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9800/500000]
+ optim/total_grad_norm=0.7425
+ train/ActionNoiseL2Loss=0.0116
+ throughput/total_tokens=1,881,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9801/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,881,792,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9802/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,881,984,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9803/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,882,176,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9804/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,882,368,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9805/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,882,560,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9806/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,882,752,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9807/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,882,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9808/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=1,883,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9809/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,883,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9810/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,883,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=9811/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,883,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9812/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=1,883,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9813/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,884,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9814/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,884,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9815/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=1,884,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9816/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,884,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9817/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,884,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9818/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,885,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9819/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=1,885,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9820/500000]
+ optim/total_grad_norm=1.054
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,885,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9821/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,885,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9822/500000]
+ train/ActionNoiseL2Loss=0.1324
+ throughput/total_tokens=1,885,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9823/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,886,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9824/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,886,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9825/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=1,886,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9826/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,886,592,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9827/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,886,784,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9828/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,886,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9829/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,887,168,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=9830/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,887,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9831/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,887,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9832/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,887,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9833/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,887,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9834/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,888,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9835/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,888,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9836/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,888,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9837/500000]
+ train/ActionNoiseL2Loss=0.0127
+ throughput/total_tokens=1,888,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9838/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,888,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9839/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,889,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9840/500000]
+ optim/total_grad_norm=0.9999
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,889,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9841/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,889,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9842/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,889,664,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9843/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,889,856,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9844/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,890,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9845/500000]
+ train/ActionNoiseL2Loss=0.0147
+ throughput/total_tokens=1,890,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9846/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=1,890,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9847/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,890,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9848/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,890,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9849/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,891,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9850/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,891,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9851/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,891,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9852/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,891,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9853/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,891,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9854/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,891,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9855/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,892,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9856/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=1,892,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9857/500000]
+ train/ActionNoiseL2Loss=0.0109
+ throughput/total_tokens=1,892,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9858/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,892,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9859/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=1,892,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9860/500000]
+ optim/total_grad_norm=0.9088
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,893,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=9861/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,893,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9862/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,893,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9863/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,893,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9864/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,893,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9865/500000]
+ train/ActionNoiseL2Loss=0.0107
+ throughput/total_tokens=1,894,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9866/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,894,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9867/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,894,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9868/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,894,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9869/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,894,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9870/500000]
+ train/ActionNoiseL2Loss=0.0097
+ throughput/total_tokens=1,895,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9871/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,895,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9872/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=1,895,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9873/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,895,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9874/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,895,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9875/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,896,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9876/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,896,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9877/500000]
+ train/ActionNoiseL2Loss=0.0103
+ throughput/total_tokens=1,896,384,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9878/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,896,576,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9879/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,896,768,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9880/500000]
+ optim/total_grad_norm=1.276
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,896,960,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9881/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,897,152,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9882/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,897,344,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9883/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,897,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9884/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,897,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9885/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,897,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9886/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=1,898,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9887/500000]
+ train/ActionNoiseL2Loss=0.0092
+ throughput/total_tokens=1,898,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9888/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=1,898,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9889/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,898,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9890/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,898,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9891/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,899,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9892/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,899,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9893/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,899,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9894/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=1,899,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9895/500000]
+ train/ActionNoiseL2Loss=0.0110
+ throughput/total_tokens=1,899,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9896/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,900,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9897/500000]
+ train/ActionNoiseL2Loss=0.0085
+ throughput/total_tokens=1,900,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9898/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,900,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9899/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=1,900,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9900/500000]
+ optim/total_grad_norm=0.8295
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,900,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=9901/500000]
+ train/ActionNoiseL2Loss=0.0138
+ throughput/total_tokens=1,900,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9902/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,901,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9903/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,901,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9904/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,901,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9905/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=1,901,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9906/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,901,952,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9907/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,902,144,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9908/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=1,902,336,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9909/500000]
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=1,902,528,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9910/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,902,720,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=9911/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,902,912,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9912/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=1,903,104,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9913/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,903,296,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9914/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,903,488,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9915/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,903,680,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9916/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=1,903,872,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9917/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,904,064,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9918/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=1,904,256,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9919/500000]
+ train/ActionNoiseL2Loss=0.0128
+ throughput/total_tokens=1,904,448,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9920/500000]
+ optim/total_grad_norm=0.5818
+ train/ActionNoiseL2Loss=0.0098
+ throughput/total_tokens=1,904,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9921/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=1,904,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9922/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,905,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9923/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,905,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9924/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,905,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9925/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,905,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9926/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,905,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9927/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=1,905,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9928/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,906,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9929/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,906,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9930/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,906,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9931/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,906,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9932/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,906,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9933/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=1,907,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9934/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,907,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9935/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=1,907,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9936/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=1,907,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9937/500000]
+ train/ActionNoiseL2Loss=0.0106
+ throughput/total_tokens=1,907,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9938/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,908,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9939/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,908,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9940/500000]
+ optim/total_grad_norm=1.483
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=1,908,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9941/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,908,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9942/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=1,908,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9943/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,909,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9944/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,909,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9945/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,909,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9946/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,909,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9947/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=1,909,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9948/500000]
+ train/ActionNoiseL2Loss=0.0131
+ throughput/total_tokens=1,910,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9949/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,910,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9950/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,910,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9951/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,910,592,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9952/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,910,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9953/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,910,976,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9954/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,911,168,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9955/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,911,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9956/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,911,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9957/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,911,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9958/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,911,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9959/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,912,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9960/500000]
+ optim/total_grad_norm=1.551
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,912,320,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=9961/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,912,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9962/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,912,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9963/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,912,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9964/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,913,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9965/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,913,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9966/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=1,913,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9967/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,913,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9968/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,913,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9969/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,914,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9970/500000]
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=1,914,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9971/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,914,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9972/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,914,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9973/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=1,914,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9974/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,915,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9975/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,915,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9976/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,915,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9977/500000]
+ train/ActionNoiseL2Loss=0.0121
+ throughput/total_tokens=1,915,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9978/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,915,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9979/500000]
+ train/ActionNoiseL2Loss=0.0123
+ throughput/total_tokens=1,915,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9980/500000]
+ optim/total_grad_norm=0.8552
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,916,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9981/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,916,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9982/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,916,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9983/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=1,916,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9984/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,916,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9985/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,917,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9986/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=1,917,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9987/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,917,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9988/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,917,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9989/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,917,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9990/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,918,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=9991/500000]
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=1,918,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9992/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,918,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9993/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,918,656,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=9994/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,918,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9995/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,919,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9996/500000]
+ train/ActionNoiseL2Loss=0.0109
+ throughput/total_tokens=1,919,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9997/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,919,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9998/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,919,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=9999/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,919,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10000/500000]
+ optim/total_grad_norm=1.725
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=1,920,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+10/05 [03:55:12] INFO | >> Saving config... checkpoint.py:608
+10/05 [03:55:46] INFO | >> Saving model state... checkpoint.py:796
+10/05 [03:56:59] INFO | >> Saving optim state... checkpoint.py:811
+10/05 [03:58:31] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=10001/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=1,920,192,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10002/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,920,384,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=10003/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,920,576,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=10004/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,920,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=10005/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,920,960,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10006/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,921,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=10007/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,921,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10008/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,921,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10009/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,921,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10010/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=1,921,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10011/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=1,922,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10012/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,922,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10013/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,922,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10014/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,922,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10015/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,922,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10016/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=1,923,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10017/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,923,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10018/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,923,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10019/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=1,923,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10020/500000]
+ optim/total_grad_norm=1.247
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,923,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10021/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,924,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10022/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,924,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10023/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,924,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10024/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,924,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10025/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,924,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10026/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,924,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10027/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=1,925,184,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10028/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,925,376,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10029/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,925,568,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10030/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,925,760,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10031/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,925,952,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10032/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,926,144,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10033/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,926,336,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10034/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,926,528,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10035/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,926,720,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10036/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,926,912,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10037/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=1,927,104,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10038/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,927,296,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10039/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,927,488,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10040/500000]
+ optim/total_grad_norm=1.444
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,927,680,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10041/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,927,872,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10042/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=1,928,064,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10043/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,928,256,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10044/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,928,448,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10045/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,928,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10046/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=1,928,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10047/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=1,929,024,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10048/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,929,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10049/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,929,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10050/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,929,600,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10051/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,929,792,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10052/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,929,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10053/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,930,176,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10054/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,930,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10055/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,930,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10056/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=1,930,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10057/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,930,944,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10058/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,931,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10059/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=1,931,328,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10060/500000]
+ optim/total_grad_norm=0.8373
+ train/ActionNoiseL2Loss=0.0131
+ throughput/total_tokens=1,931,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=10061/500000]
+ train/ActionNoiseL2Loss=0.1471
+ throughput/total_tokens=1,931,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10062/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,931,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10063/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,932,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10064/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=1,932,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10065/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,932,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10066/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=1,932,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10067/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,932,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10068/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,933,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10069/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=1,933,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10070/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,933,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10071/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,933,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10072/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,933,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10073/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=1,934,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10074/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,934,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10075/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,934,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10076/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,934,592,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10077/500000]
+ train/ActionNoiseL2Loss=0.0096
+ throughput/total_tokens=1,934,784,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10078/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,934,976,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10079/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,935,168,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10080/500000]
+ optim/total_grad_norm=0.9180
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,935,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10081/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,935,552,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10082/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,935,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10083/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,935,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10084/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,936,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10085/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,936,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10086/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,936,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10087/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,936,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10088/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,936,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10089/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=1,937,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10090/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,937,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10091/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,937,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10092/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,937,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10093/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=1,937,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10094/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,938,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10095/500000]
+ train/ActionNoiseL2Loss=0.0081
+ throughput/total_tokens=1,938,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10096/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=1,938,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10097/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=1,938,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10098/500000]
+ train/ActionNoiseL2Loss=0.0138
+ throughput/total_tokens=1,938,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10099/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,939,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10100/500000]
+ optim/total_grad_norm=0.7414
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,939,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10101/500000]
+ train/ActionNoiseL2Loss=0.0128
+ throughput/total_tokens=1,939,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10102/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,939,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10103/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,939,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10104/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=1,939,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10105/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=1,940,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10106/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,940,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10107/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,940,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10108/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,940,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10109/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,940,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10110/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,941,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=10111/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,941,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10112/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=1,941,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10113/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,941,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10114/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,941,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10115/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=1,942,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10116/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,942,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10117/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=1,942,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10118/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,942,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10119/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,942,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10120/500000]
+ optim/total_grad_norm=0.9099
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,943,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10121/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,943,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10122/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=1,943,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10123/500000]
+ train/ActionNoiseL2Loss=0.0133
+ throughput/total_tokens=1,943,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10124/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,943,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10125/500000]
+ train/ActionNoiseL2Loss=0.0127
+ throughput/total_tokens=1,944,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10126/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,944,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10127/500000]
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=1,944,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10128/500000]
+ train/ActionNoiseL2Loss=0.0123
+ throughput/total_tokens=1,944,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10129/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,944,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10130/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,944,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10131/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=1,945,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10132/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,945,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10133/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,945,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10134/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=1,945,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10135/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,945,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10136/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,946,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10137/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,946,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10138/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,946,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10139/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,946,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10140/500000]
+ optim/total_grad_norm=1.258
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,946,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10141/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,947,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10142/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,947,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10143/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=1,947,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10144/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,947,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10145/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,947,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10146/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=1,948,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10147/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=1,948,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10148/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,948,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10149/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,948,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10150/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=1,948,800,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10151/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,948,992,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10152/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,949,184,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10153/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,949,376,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10154/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=1,949,568,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10155/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=1,949,760,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10156/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,949,952,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10157/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,950,144,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10158/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=1,950,336,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10159/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,950,528,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10160/500000]
+ optim/total_grad_norm=1.066
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,950,720,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+ System/Peak GPU Memory (MB)=46,467
+[step=10161/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,950,912,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10162/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=1,951,104,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10163/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,951,296,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10164/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,951,488,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10165/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,951,680,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10166/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,951,872,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10167/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=1,952,064,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10168/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,952,256,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10169/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,952,448,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=10170/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,952,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10171/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,952,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10172/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,953,024,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10173/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,953,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10174/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,953,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10175/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,953,600,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10176/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,953,792,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10177/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,953,984,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10178/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,954,176,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10179/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=1,954,368,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10180/500000]
+ optim/total_grad_norm=1.299
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,954,560,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10181/500000]
+ train/ActionNoiseL2Loss=0.0105
+ throughput/total_tokens=1,954,752,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10182/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,954,944,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10183/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,955,136,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10184/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=1,955,328,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10185/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=1,955,520,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10186/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,955,712,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10187/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,955,904,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10188/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=1,956,096,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10189/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,956,288,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10190/500000]
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=1,956,480,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10191/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,956,672,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10192/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,956,864,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10193/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,957,056,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10194/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,957,248,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10195/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,957,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10196/500000]
+ train/ActionNoiseL2Loss=0.0120
+ throughput/total_tokens=1,957,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10197/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,957,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10198/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,958,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10199/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,958,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10200/500000]
+ optim/total_grad_norm=0.8686
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,958,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10201/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,958,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10202/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,958,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10203/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=1,958,976,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10204/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,959,168,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10205/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=1,959,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10206/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,959,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10207/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=1,959,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10208/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,959,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10209/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,960,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10210/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,960,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=10211/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,960,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10212/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,960,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10213/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,960,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10214/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,961,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10215/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=1,961,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10216/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,961,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10217/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=1,961,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10218/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,961,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10219/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=1,962,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10220/500000]
+ optim/total_grad_norm=1.065
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,962,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10221/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,962,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10222/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,962,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10223/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=1,962,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10224/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,963,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10225/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,963,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10226/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=1,963,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10227/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,963,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10228/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,963,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10229/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,963,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10230/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,964,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10231/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,964,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10232/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,964,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10233/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,964,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10234/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=1,964,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10235/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,965,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10236/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,965,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10237/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,965,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10238/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,965,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10239/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,965,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10240/500000]
+ optim/total_grad_norm=0.8166
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,966,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10241/500000]
+ train/ActionNoiseL2Loss=0.0137
+ throughput/total_tokens=1,966,272,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10242/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,966,464,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10243/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,966,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10244/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,966,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10245/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,967,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10246/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=1,967,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10247/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,967,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10248/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=1,967,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10249/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,967,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10250/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,968,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10251/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,968,192,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10252/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,968,384,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10253/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,968,576,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10254/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,968,768,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10255/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,968,960,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10256/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,969,152,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10257/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,969,344,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10258/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,969,536,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10259/500000]
+ train/ActionNoiseL2Loss=0.0133
+ throughput/total_tokens=1,969,728,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10260/500000]
+ optim/total_grad_norm=0.4785
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=1,969,920,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=10261/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,970,112,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10262/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=1,970,304,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10263/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=1,970,496,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10264/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=1,970,688,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10265/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,970,880,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10266/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=1,971,072,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10267/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=1,971,264,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10268/500000]
+ train/ActionNoiseL2Loss=0.0143
+ throughput/total_tokens=1,971,456,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10269/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,971,648,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10270/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=1,971,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10271/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,972,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10272/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,972,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10273/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,972,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10274/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,972,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10275/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,972,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10276/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,972,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10277/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=1,973,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10278/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,973,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10279/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,973,568,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10280/500000]
+ optim/total_grad_norm=1.150
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=1,973,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10281/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,973,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10282/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,974,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10283/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,974,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10284/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,974,528,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10285/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=1,974,720,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10286/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,974,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10287/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,975,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10288/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,975,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10289/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=1,975,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10290/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=1,975,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10291/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,975,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10292/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=1,976,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10293/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=1,976,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10294/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=1,976,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10295/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,976,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10296/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=1,976,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10297/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=1,977,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10298/500000]
+ train/ActionNoiseL2Loss=0.0109
+ throughput/total_tokens=1,977,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10299/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=1,977,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10300/500000]
+ optim/total_grad_norm=0.4556
+ train/ActionNoiseL2Loss=0.0073
+ throughput/total_tokens=1,977,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10301/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,977,792,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10302/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=1,977,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10303/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=1,978,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10304/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=1,978,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10305/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,978,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10306/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,978,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10307/500000]
+ train/ActionNoiseL2Loss=0.0075
+ throughput/total_tokens=1,978,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10308/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,979,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10309/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,979,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10310/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,979,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=10311/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,979,712,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10312/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,979,904,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10313/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=1,980,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10314/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,980,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10315/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,980,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10316/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,980,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10317/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,980,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10318/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,981,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10319/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,981,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10320/500000]
+ optim/total_grad_norm=0.9946
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,981,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10321/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,981,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10322/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,981,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10323/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,982,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10324/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,982,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10325/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,982,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10326/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=1,982,592,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10327/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,982,784,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10328/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,982,976,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10329/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,983,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10330/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,983,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10331/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,983,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10332/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,983,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10333/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,983,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10334/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,984,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10335/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,984,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10336/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,984,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10337/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,984,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10338/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,984,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10339/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,985,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10340/500000]
+ optim/total_grad_norm=0.7891
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,985,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10341/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,985,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10342/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,985,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10343/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,985,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10344/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,986,048,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10345/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=1,986,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10346/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,986,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10347/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=1,986,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10348/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,986,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10349/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=1,987,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10350/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,987,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10351/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,987,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10352/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,987,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10353/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=1,987,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10354/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,987,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10355/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=1,988,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10356/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,988,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10357/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=1,988,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10358/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=1,988,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10359/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,988,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10360/500000]
+ optim/total_grad_norm=1.550
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,989,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=10361/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,989,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10362/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,989,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10363/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,989,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10364/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,989,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10365/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,990,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10366/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=1,990,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10367/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,990,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10368/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,990,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10369/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,990,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10370/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,991,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10371/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=1,991,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10372/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,991,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10373/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,991,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10374/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,991,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10375/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=1,992,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10376/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,992,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10377/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,992,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10378/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,992,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10379/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=1,992,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10380/500000]
+ optim/total_grad_norm=1.324
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,992,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10381/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,993,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10382/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,993,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10383/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,993,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10384/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,993,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10385/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,993,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10386/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,994,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10387/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,994,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10388/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,994,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10389/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,994,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10390/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,994,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10391/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,995,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10392/500000]
+ train/ActionNoiseL2Loss=0.0143
+ throughput/total_tokens=1,995,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10393/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=1,995,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10394/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,995,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10395/500000]
+ train/ActionNoiseL2Loss=0.0127
+ throughput/total_tokens=1,995,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10396/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,996,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10397/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=1,996,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10398/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=1,996,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10399/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,996,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10400/500000]
+ optim/total_grad_norm=0.5499
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=1,996,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10401/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,996,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10402/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=1,997,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10403/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,997,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10404/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=1,997,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10405/500000]
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=1,997,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10406/500000]
+ train/ActionNoiseL2Loss=0.0130
+ throughput/total_tokens=1,997,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10407/500000]
+ train/ActionNoiseL2Loss=0.0102
+ throughput/total_tokens=1,998,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10408/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,998,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10409/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=1,998,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10410/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,998,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=10411/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,998,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10412/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,999,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10413/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,999,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10414/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,999,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10415/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,999,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10416/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,999,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10417/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=2,000,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10418/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,000,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10419/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=2,000,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10420/500000]
+ optim/total_grad_norm=0.6280
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=2,000,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10421/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=2,000,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10422/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=2,001,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10423/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=2,001,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10424/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=2,001,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10425/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=2,001,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10426/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=2,001,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10427/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=2,001,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10428/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=2,002,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10429/500000]
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=2,002,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10430/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=2,002,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10431/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=2,002,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10432/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=2,002,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10433/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=2,003,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10434/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=2,003,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10435/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=2,003,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10436/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=2,003,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10437/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=2,003,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10438/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=2,004,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10439/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=2,004,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10440/500000]
+ optim/total_grad_norm=0.9549
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=2,004,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10441/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=2,004,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10442/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=2,004,864,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10443/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=2,005,056,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10444/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=2,005,248,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10445/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=2,005,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10446/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=2,005,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10447/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,005,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10448/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=2,006,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10449/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=2,006,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10450/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=2,006,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10451/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=2,006,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10452/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=2,006,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10453/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=2,006,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10454/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=2,007,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10455/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=2,007,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10456/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=2,007,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10457/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=2,007,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10458/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=2,007,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10459/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,008,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10460/500000]
+ optim/total_grad_norm=2.309
+ train/ActionNoiseL2Loss=0.0998
+ throughput/total_tokens=2,008,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=10461/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=2,008,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10462/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=2,008,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10463/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=2,008,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10464/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=2,009,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10465/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=2,009,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10466/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,009,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10467/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=2,009,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10468/500000]
+ train/ActionNoiseL2Loss=0.0104
+ throughput/total_tokens=2,009,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10469/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=2,010,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10470/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,010,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10471/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=2,010,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10472/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=2,010,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10473/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=2,010,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10474/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=2,011,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10475/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=2,011,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10476/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=2,011,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10477/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=2,011,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10478/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,011,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10479/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=2,011,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10480/500000]
+ optim/total_grad_norm=1.226
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=2,012,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10481/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=2,012,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10482/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=2,012,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10483/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=2,012,736,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10484/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=2,012,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10485/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=2,013,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10486/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=2,013,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10487/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=2,013,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10488/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=2,013,696,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10489/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,013,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10490/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=2,014,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10491/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=2,014,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10492/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=2,014,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10493/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=2,014,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10494/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=2,014,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10495/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=2,015,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10496/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=2,015,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10497/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=2,015,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10498/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=2,015,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10499/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=2,015,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10500/500000]
+ optim/total_grad_norm=1.167
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=2,016,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+10/05 [06:53:03] INFO | >> Saving config... checkpoint.py:608
+10/05 [06:53:54] INFO | >> Saving model state... checkpoint.py:796
+10/05 [06:55:02] INFO | >> Saving optim state... checkpoint.py:811
+10/05 [06:56:34] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=10501/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=2,016,192,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=10502/500000]
+ train/ActionNoiseL2Loss=0.0121
+ throughput/total_tokens=2,016,384,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=10503/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=2,016,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=10504/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,016,768,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=10505/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=2,016,960,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=10506/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=2,017,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=10507/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=2,017,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10508/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=2,017,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=10509/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=2,017,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10510/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=2,017,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10511/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=2,018,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10512/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=2,018,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10513/500000]
+ train/ActionNoiseL2Loss=0.0105
+ throughput/total_tokens=2,018,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10514/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=2,018,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10515/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=2,018,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10516/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=2,019,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10517/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=2,019,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10518/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=2,019,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10519/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=2,019,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10520/500000]
+ optim/total_grad_norm=0.8387
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=2,019,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10521/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=2,020,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10522/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=2,020,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10523/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=2,020,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10524/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=2,020,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10525/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,020,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10526/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=2,020,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10527/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=2,021,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10528/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=2,021,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10529/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=2,021,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10530/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=2,021,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10531/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,021,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10532/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=2,022,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10533/500000]
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=2,022,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10534/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=2,022,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10535/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=2,022,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10536/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=2,022,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10537/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=2,023,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10538/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,023,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10539/500000]
+ train/ActionNoiseL2Loss=0.0111
+ throughput/total_tokens=2,023,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10540/500000]
+ optim/total_grad_norm=1.488
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=2,023,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10541/500000]
+ train/ActionNoiseL2Loss=0.0138
+ throughput/total_tokens=2,023,872,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10542/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=2,024,064,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10543/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,024,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10544/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,024,448,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10545/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=2,024,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10546/500000]
+ train/ActionNoiseL2Loss=0.0124
+ throughput/total_tokens=2,024,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10547/500000]
+ train/ActionNoiseL2Loss=0.0142
+ throughput/total_tokens=2,025,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10548/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=2,025,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10549/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=2,025,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10550/500000]
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=2,025,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10551/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=2,025,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10552/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=2,025,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10553/500000]
+ train/ActionNoiseL2Loss=0.0125
+ throughput/total_tokens=2,026,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10554/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=2,026,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10555/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=2,026,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10556/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,026,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10557/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=2,026,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10558/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=2,027,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10559/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=2,027,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10560/500000]
+ optim/total_grad_norm=1.182
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=2,027,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=10561/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=2,027,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10562/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,027,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10563/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=2,028,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10564/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=2,028,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10565/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=2,028,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10566/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,028,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10567/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=2,028,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10568/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=2,029,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10569/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=2,029,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10570/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=2,029,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10571/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=2,029,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10572/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=2,029,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10573/500000]
+ train/ActionNoiseL2Loss=0.0124
+ throughput/total_tokens=2,030,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10574/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=2,030,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10575/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=2,030,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10576/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=2,030,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10577/500000]
+ train/ActionNoiseL2Loss=0.1242
+ throughput/total_tokens=2,030,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10578/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,030,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10579/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=2,031,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10580/500000]
+ optim/total_grad_norm=0.9944
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=2,031,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10581/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=2,031,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10582/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=2,031,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10583/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=2,031,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10584/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=2,032,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10585/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=2,032,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10586/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,032,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10587/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=2,032,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10588/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=2,032,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10589/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=2,033,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10590/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=2,033,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10591/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=2,033,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10592/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=2,033,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10593/500000]
+ train/ActionNoiseL2Loss=0.1281
+ throughput/total_tokens=2,033,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10594/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=2,034,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10595/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=2,034,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10596/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,034,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10597/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=2,034,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10598/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=2,034,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10599/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=2,035,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10600/500000]
+ optim/total_grad_norm=1.073
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=2,035,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10601/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=2,035,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10602/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=2,035,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10603/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,035,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10604/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=2,035,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10605/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=2,036,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10606/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=2,036,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10607/500000]
+ train/ActionNoiseL2Loss=0.0109
+ throughput/total_tokens=2,036,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10608/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=2,036,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10609/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=2,036,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10610/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=2,037,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=10611/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=2,037,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10612/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,037,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10613/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=2,037,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10614/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,037,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10615/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=2,038,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10616/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=2,038,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10617/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=2,038,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10618/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=2,038,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10619/500000]
+ train/ActionNoiseL2Loss=0.0096
+ throughput/total_tokens=2,038,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10620/500000]
+ optim/total_grad_norm=0.5850
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=2,039,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10621/500000]
+ train/ActionNoiseL2Loss=0.0144
+ throughput/total_tokens=2,039,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10622/500000]
+ train/ActionNoiseL2Loss=0.0096
+ throughput/total_tokens=2,039,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10623/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=2,039,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10624/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=2,039,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10625/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,040,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10626/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=2,040,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10627/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=2,040,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10628/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=2,040,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10629/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=2,040,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10630/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=2,040,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10631/500000]
+ train/ActionNoiseL2Loss=0.0142
+ throughput/total_tokens=2,041,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10632/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=2,041,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10633/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=2,041,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10634/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,041,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10635/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=2,041,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10636/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=2,042,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10637/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=2,042,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10638/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=2,042,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10639/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=2,042,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10640/500000]
+ optim/total_grad_norm=1.121
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=2,042,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10641/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=2,043,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10642/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=2,043,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10643/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=2,043,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10644/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=2,043,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10645/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=2,043,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10646/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=2,044,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10647/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=2,044,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10648/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=2,044,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10649/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=2,044,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10650/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=2,044,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10651/500000]
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=2,044,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10652/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=2,045,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10653/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=2,045,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10654/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=2,045,568,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10655/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=2,045,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10656/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,045,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10657/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=2,046,144,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10658/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=2,046,336,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10659/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=2,046,528,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10660/500000]
+ optim/total_grad_norm=0.8576
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=2,046,720,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=46,467
+[step=10661/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=2,046,912,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10662/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,047,104,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10663/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=2,047,296,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10664/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=2,047,488,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10665/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=2,047,680,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10666/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=2,047,872,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10667/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,048,064,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10668/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,048,256,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10669/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=2,048,448,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10670/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=2,048,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10671/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=2,048,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10672/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=2,049,024,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10673/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=2,049,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10674/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=2,049,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10675/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=2,049,600,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10676/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=2,049,792,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10677/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=2,049,984,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10678/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,050,176,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10679/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=2,050,368,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10680/500000]
+ optim/total_grad_norm=1.935
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=2,050,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10681/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=2,050,752,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10682/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,050,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10683/500000]
+ train/ActionNoiseL2Loss=0.0124
+ throughput/total_tokens=2,051,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10684/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=2,051,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10685/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,051,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10686/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=2,051,712,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10687/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=2,051,904,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10688/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=2,052,096,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10689/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=2,052,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10690/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,052,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10691/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=2,052,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10692/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=2,052,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10693/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=2,053,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10694/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=2,053,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10695/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=2,053,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10696/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=2,053,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10697/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=2,053,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10698/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,054,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10699/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=2,054,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10700/500000]
+ optim/total_grad_norm=0.9197
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=2,054,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10701/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,054,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10702/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=2,054,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10703/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=2,054,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10704/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=2,055,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10705/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=2,055,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10706/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=2,055,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10707/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=2,055,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10708/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=2,055,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10709/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=2,056,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10710/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=2,056,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=10711/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=2,056,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10712/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=2,056,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10713/500000]
+ train/ActionNoiseL2Loss=0.0143
+ throughput/total_tokens=2,056,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10714/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=2,057,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10715/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=2,057,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10716/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,057,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10717/500000]
+ train/ActionNoiseL2Loss=0.0127
+ throughput/total_tokens=2,057,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10718/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,057,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10719/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,058,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10720/500000]
+ optim/total_grad_norm=0.6251
+ train/ActionNoiseL2Loss=0.0133
+ throughput/total_tokens=2,058,240,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10721/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=2,058,432,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10722/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=2,058,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10723/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=2,058,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10724/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=2,059,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10725/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=2,059,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10726/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=2,059,392,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10727/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=2,059,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10728/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,059,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10729/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=2,059,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10730/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=2,060,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10731/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=2,060,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10732/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=2,060,544,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10733/500000]
+ train/ActionNoiseL2Loss=0.0103
+ throughput/total_tokens=2,060,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10734/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=2,060,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10735/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=2,061,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10736/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=2,061,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10737/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=2,061,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10738/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=2,061,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10739/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=2,061,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10740/500000]
+ optim/total_grad_norm=0.7677
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=2,062,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10741/500000]
+ train/ActionNoiseL2Loss=0.0142
+ throughput/total_tokens=2,062,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10742/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=2,062,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10743/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=2,062,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10744/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=2,062,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10745/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=2,063,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10746/500000]
+ train/ActionNoiseL2Loss=0.0125
+ throughput/total_tokens=2,063,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10747/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=2,063,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10748/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=2,063,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10749/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=2,063,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10750/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=2,064,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10751/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=2,064,192,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10752/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=2,064,384,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10753/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=2,064,576,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10754/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=2,064,768,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10755/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=2,064,960,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10756/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=2,065,152,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10757/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=2,065,344,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10758/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=2,065,536,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10759/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=2,065,728,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10760/500000]
+ optim/total_grad_norm=1.830
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=2,065,920,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=10761/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=2,066,112,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10762/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=2,066,304,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10763/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=2,066,496,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10764/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=2,066,688,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10765/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=2,066,880,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10766/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=2,067,072,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10767/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=2,067,264,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10768/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=2,067,456,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10769/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=2,067,648,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10770/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=2,067,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10771/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=2,068,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10772/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=2,068,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10773/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=2,068,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10774/500000]
+ train/ActionNoiseL2Loss=0.0142
+ throughput/total_tokens=2,068,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10775/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=2,068,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10776/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=2,068,992,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10777/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=2,069,184,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10778/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=2,069,376,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10779/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=2,069,568,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10780/500000]
+ optim/total_grad_norm=0.7064
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=2,069,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10781/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=2,069,952,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10782/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=2,070,144,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10783/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=2,070,336,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10784/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=2,070,528,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10785/500000]
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=2,070,720,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10786/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=2,070,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10787/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,071,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10788/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,071,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10789/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=2,071,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10790/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=2,071,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10791/500000]
+ train/ActionNoiseL2Loss=0.0131
+ throughput/total_tokens=2,071,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10792/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=2,072,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10793/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=2,072,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10794/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=2,072,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10795/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=2,072,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10796/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,072,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10797/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=2,073,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10798/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=2,073,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10799/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=2,073,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10800/500000]
+ optim/total_grad_norm=0.8286
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=2,073,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10801/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=2,073,792,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=10802/500000]
+ train/ActionNoiseL2Loss=0.0127
+ throughput/total_tokens=2,073,984,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=10803/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=2,074,176,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=10804/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=2,074,368,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=10805/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=2,074,560,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=10806/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=2,074,752,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=10807/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=2,074,944,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=10808/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=2,075,136,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10809/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=2,075,328,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10810/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=2,075,520,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=46,467
+[step=10811/500000]
+ train/ActionNoiseL2Loss=0.0105
+ throughput/total_tokens=2,075,712,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10812/500000]
+ train/ActionNoiseL2Loss=0.0147
+ throughput/total_tokens=2,075,904,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10813/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=2,076,096,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10814/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=2,076,288,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10815/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=2,076,480,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10816/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=2,076,672,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10817/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=2,076,864,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10818/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=2,077,056,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10819/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=2,077,248,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10820/500000]
+ optim/total_grad_norm=0.8464
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=2,077,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10821/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=2,077,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10822/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=2,077,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10823/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=2,078,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10824/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=2,078,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10825/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=2,078,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10826/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=2,078,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10827/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=2,078,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10828/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=2,078,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10829/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=2,079,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10830/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=2,079,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10831/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=2,079,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10832/500000]
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=2,079,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10833/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=2,079,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10834/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=2,080,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10835/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=2,080,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10836/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=2,080,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10837/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=2,080,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10838/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=2,080,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10839/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=2,081,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10840/500000]
+ optim/total_grad_norm=1.096
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=2,081,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10841/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=2,081,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10842/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=2,081,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10843/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=2,081,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10844/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=2,082,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10845/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,082,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10846/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=2,082,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10847/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=2,082,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10848/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=2,082,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10849/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=2,083,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10850/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=2,083,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10851/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=2,083,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10852/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=2,083,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10853/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=2,083,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10854/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,083,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10855/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,084,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10856/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,084,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10857/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=2,084,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10858/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=2,084,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10859/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=2,084,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10860/500000]
+ optim/total_grad_norm=1.383
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=2,085,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=10861/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=2,085,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10862/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=2,085,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10863/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,085,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10864/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=2,085,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10865/500000]
+ train/ActionNoiseL2Loss=0.0131
+ throughput/total_tokens=2,086,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10866/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=2,086,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10867/500000]
+ train/ActionNoiseL2Loss=0.0122
+ throughput/total_tokens=2,086,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10868/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=2,086,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10869/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=2,086,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10870/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,087,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10871/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=2,087,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10872/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=2,087,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10873/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=2,087,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10874/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=2,087,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10875/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=2,088,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10876/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=2,088,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10877/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=2,088,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10878/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=2,088,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10879/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=2,088,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10880/500000]
+ optim/total_grad_norm=0.7648
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=2,088,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10881/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=2,089,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10882/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=2,089,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10883/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=2,089,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10884/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=2,089,728,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10885/500000]
+ train/ActionNoiseL2Loss=0.0118
+ throughput/total_tokens=2,089,920,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10886/500000]
+ train/ActionNoiseL2Loss=0.0143
+ throughput/total_tokens=2,090,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10887/500000]
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=2,090,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10888/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=2,090,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10889/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=2,090,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10890/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=2,090,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10891/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=2,091,072,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10892/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=2,091,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10893/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=2,091,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10894/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=2,091,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10895/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=2,091,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10896/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=2,092,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10897/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=2,092,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10898/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=2,092,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10899/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=2,092,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=10900/500000]
+ optim/total_grad_norm=1.411
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=2,092,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10901/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=2,092,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10902/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=2,093,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10903/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=2,093,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10904/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=2,093,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10905/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=2,093,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10906/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=2,093,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10907/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=2,094,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10908/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=2,094,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10909/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=2,094,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10910/500000]
+ train/ActionNoiseL2Loss=0.0121
+ throughput/total_tokens=2,094,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=10911/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=2,094,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10912/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=2,095,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10913/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=2,095,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10914/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=2,095,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10915/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=2,095,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10916/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=2,095,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10917/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=2,096,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10918/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=2,096,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10919/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=2,096,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10920/500000]
+ optim/total_grad_norm=0.6111
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=2,096,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10921/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=2,096,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10922/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=2,097,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10923/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=2,097,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10924/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=2,097,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10925/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=2,097,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10926/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=2,097,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10927/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,097,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10928/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=2,098,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10929/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=2,098,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10930/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=2,098,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10931/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=2,098,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10932/500000]
+ train/ActionNoiseL2Loss=0.0105
+ throughput/total_tokens=2,098,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10933/500000]
+ train/ActionNoiseL2Loss=0.0074
+ throughput/total_tokens=2,099,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10934/500000]
+ train/ActionNoiseL2Loss=0.0124
+ throughput/total_tokens=2,099,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10935/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=2,099,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10936/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=2,099,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10937/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=2,099,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10938/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=2,100,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10939/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=2,100,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10940/500000]
+ optim/total_grad_norm=1.106
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=2,100,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10941/500000]
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=2,100,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10942/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,100,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10943/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=2,101,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10944/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=2,101,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10945/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=2,101,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10946/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=2,101,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10947/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=2,101,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10948/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=2,102,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10949/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=2,102,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10950/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=2,102,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10951/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=2,102,592,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=10952/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=2,102,784,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=10953/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=2,102,976,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=10954/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,103,168,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=10955/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=2,103,360,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=10956/500000]
+ train/ActionNoiseL2Loss=0.0132
+ throughput/total_tokens=2,103,552,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=10957/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=2,103,744,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=10958/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=2,103,936,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=10959/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=2,104,128,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=10960/500000]
+ optim/total_grad_norm=1.535
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=2,104,320,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+ System/Peak GPU Memory (MB)=46,467
+[step=10961/500000]
+ train/ActionNoiseL2Loss=0.0143
+ throughput/total_tokens=2,104,512,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=10962/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=2,104,704,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=10963/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=2,104,896,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=10964/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,105,088,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=10965/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=2,105,280,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=10966/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=2,105,472,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=10967/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=2,105,664,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=10968/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=2,105,856,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=10969/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=2,106,048,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=10970/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=2,106,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=10971/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=2,106,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10972/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=2,106,624,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10973/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=2,106,816,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10974/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=2,107,008,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10975/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=2,107,200,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10976/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,107,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10977/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=2,107,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10978/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=2,107,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10979/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=2,107,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10980/500000]
+ optim/total_grad_norm=1.238
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=2,108,160,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10981/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=2,108,352,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10982/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=2,108,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10983/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=2,108,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10984/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=2,108,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10985/500000]
+ train/ActionNoiseL2Loss=0.0128
+ throughput/total_tokens=2,109,120,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10986/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=2,109,312,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10987/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=2,109,504,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10988/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=2,109,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10989/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=2,109,888,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10990/500000]
+ train/ActionNoiseL2Loss=0.0124
+ throughput/total_tokens=2,110,080,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=10991/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=2,110,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10992/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=2,110,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10993/500000]
+ train/ActionNoiseL2Loss=0.0098
+ throughput/total_tokens=2,110,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10994/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,110,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10995/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=2,111,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10996/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=2,111,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10997/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=2,111,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10998/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=2,111,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=10999/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=2,111,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11000/500000]
+ optim/total_grad_norm=1.433
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=2,112,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+10/05 [09:51:13] INFO | >> Saving config... checkpoint.py:608
+10/05 [09:51:49] INFO | >> Saving model state... checkpoint.py:796
+10/05 [09:52:58] INFO | >> Saving optim state... checkpoint.py:811
+10/05 [09:54:32] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=11001/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=2,112,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11002/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=2,112,384,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=11003/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=2,112,576,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=11004/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=2,112,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11005/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=2,112,960,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=11006/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=2,113,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11007/500000]
+ train/ActionNoiseL2Loss=0.0206
+ throughput/total_tokens=2,113,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11008/500000]
+ train/ActionNoiseL2Loss=0.0113
+ throughput/total_tokens=2,113,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11009/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=2,113,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11010/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=2,113,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11011/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=2,114,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11012/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=2,114,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11013/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=2,114,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11014/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=2,114,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11015/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=2,114,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11016/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=2,115,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11017/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=2,115,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11018/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,115,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11019/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=2,115,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11020/500000]
+ optim/total_grad_norm=1.281
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=2,115,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11021/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=2,116,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11022/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=2,116,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11023/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=2,116,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11024/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=2,116,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11025/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=2,116,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11026/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=2,116,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11027/500000]
+ train/ActionNoiseL2Loss=0.0113
+ throughput/total_tokens=2,117,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11028/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=2,117,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11029/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=2,117,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11030/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=2,117,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11031/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=2,117,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11032/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=2,118,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11033/500000]
+ train/ActionNoiseL2Loss=0.0131
+ throughput/total_tokens=2,118,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11034/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,118,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11035/500000]
+ train/ActionNoiseL2Loss=0.0122
+ throughput/total_tokens=2,118,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11036/500000]
+ train/ActionNoiseL2Loss=0.0126
+ throughput/total_tokens=2,118,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11037/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=2,119,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11038/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=2,119,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11039/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=2,119,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11040/500000]
+ optim/total_grad_norm=1.000
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=2,119,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11041/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=2,119,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11042/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=2,120,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11043/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=2,120,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11044/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=2,120,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11045/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=2,120,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11046/500000]
+ train/ActionNoiseL2Loss=0.0121
+ throughput/total_tokens=2,120,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11047/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=2,121,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11048/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=2,121,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11049/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=2,121,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11050/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=2,121,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11051/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=2,121,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11052/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=2,121,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11053/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=2,122,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11054/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=2,122,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11055/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=2,122,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11056/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=2,122,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11057/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=2,122,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11058/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=2,123,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11059/500000]
+ train/ActionNoiseL2Loss=0.0112
+ throughput/total_tokens=2,123,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11060/500000]
+ optim/total_grad_norm=0.5627
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=2,123,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11061/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=2,123,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11062/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=2,123,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11063/500000]
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=2,124,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11064/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=2,124,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11065/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=2,124,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11066/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=2,124,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11067/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=2,124,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11068/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,125,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11069/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=2,125,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11070/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=2,125,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11071/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=2,125,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11072/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=2,125,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11073/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=2,126,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11074/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=2,126,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11075/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=2,126,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11076/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=2,126,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11077/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=2,126,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11078/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=2,126,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11079/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=2,127,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11080/500000]
+ optim/total_grad_norm=1.119
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=2,127,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11081/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=2,127,552,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11082/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,127,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11083/500000]
+ train/ActionNoiseL2Loss=0.0147
+ throughput/total_tokens=2,127,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11084/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=2,128,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11085/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,128,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11086/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=2,128,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11087/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=2,128,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11088/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=2,128,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11089/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=2,129,088,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11090/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=2,129,280,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11091/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=2,129,472,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11092/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=2,129,664,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11093/500000]
+ train/ActionNoiseL2Loss=0.0104
+ throughput/total_tokens=2,129,856,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11094/500000]
+ train/ActionNoiseL2Loss=0.0137
+ throughput/total_tokens=2,130,048,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11095/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,130,240,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11096/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=2,130,432,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11097/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=2,130,624,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11098/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=2,130,816,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11099/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=2,131,008,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11100/500000]
+ optim/total_grad_norm=0.9979
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=2,131,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11101/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=2,131,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11102/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=2,131,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11103/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=2,131,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11104/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=2,131,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11105/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=2,132,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11106/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=2,132,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11107/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=2,132,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11108/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=2,132,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11109/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=2,132,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11110/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=2,133,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11111/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=2,133,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11112/500000]
+ train/ActionNoiseL2Loss=0.0131
+ throughput/total_tokens=2,133,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11113/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=2,133,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11114/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=2,133,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11115/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=2,134,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11116/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=2,134,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11117/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=2,134,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11118/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=2,134,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11119/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=2,134,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11120/500000]
+ optim/total_grad_norm=1.297
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=2,135,040,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11121/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=2,135,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11122/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=2,135,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11123/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=2,135,616,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11124/500000]
+ train/ActionNoiseL2Loss=0.0140
+ throughput/total_tokens=2,135,808,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11125/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=2,136,000,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11126/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=2,136,192,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11127/500000]
+ train/ActionNoiseL2Loss=0.0125
+ throughput/total_tokens=2,136,384,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11128/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=2,136,576,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11129/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=2,136,768,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11130/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=2,136,960,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11131/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,137,152,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11132/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=2,137,344,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11133/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=2,137,536,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11134/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,137,728,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11135/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=2,137,920,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11136/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=2,138,112,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11137/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=2,138,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11138/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=2,138,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11139/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=2,138,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11140/500000]
+ optim/total_grad_norm=1.253
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=2,138,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11141/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=2,139,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11142/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=2,139,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11143/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=2,139,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11144/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=2,139,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11145/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=2,139,840,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11146/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=2,140,032,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11147/500000]
+ train/ActionNoiseL2Loss=0.0142
+ throughput/total_tokens=2,140,224,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11148/500000]
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=2,140,416,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11149/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=2,140,608,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11150/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=2,140,800,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11151/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=2,140,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11152/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=2,141,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11153/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=2,141,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11154/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=2,141,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11155/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=2,141,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11156/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=2,141,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11157/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=2,142,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11158/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=2,142,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11159/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=2,142,528,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11160/500000]
+ optim/total_grad_norm=0.9862
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=2,142,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11161/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=2,142,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11162/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=2,143,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11163/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=2,143,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11164/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=2,143,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11165/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=2,143,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11166/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=2,143,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11167/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=2,144,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11168/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=2,144,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11169/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=2,144,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11170/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=2,144,640,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11171/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=2,144,832,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11172/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=2,145,024,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11173/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=2,145,216,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11174/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=2,145,408,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11175/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=2,145,600,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11176/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=2,145,792,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11177/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=2,145,984,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11178/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=2,146,176,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11179/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=2,146,368,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11180/500000]
+ optim/total_grad_norm=1.311
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=2,146,560,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11181/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=2,146,752,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11182/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=2,146,944,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11183/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=2,147,136,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11184/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,147,328,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11185/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=2,147,520,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11186/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=2,147,712,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11187/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=2,147,904,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11188/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=2,148,096,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11189/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=2,148,288,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11190/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,148,480,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11191/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,148,672,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11192/500000]
+ train/ActionNoiseL2Loss=0.0306
+ throughput/total_tokens=2,148,864,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11193/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=2,149,056,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11194/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=2,149,248,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11195/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=2,149,440,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11196/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=2,149,632,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11197/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=2,149,824,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11198/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,150,016,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11199/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=2,150,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11200/500000]
+ optim/total_grad_norm=0.9229
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=2,150,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11201/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=2,150,592,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11202/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=2,150,784,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11203/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=2,150,976,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11204/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=2,151,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11205/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=2,151,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11206/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=2,151,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11207/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=2,151,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11208/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=2,151,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11209/500000]
+ train/ActionNoiseL2Loss=0.0104
+ throughput/total_tokens=2,152,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11210/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=2,152,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11211/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=2,152,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11212/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=2,152,704,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11213/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=2,152,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11214/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=2,153,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11215/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,153,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11216/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=2,153,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11217/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=2,153,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11218/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=2,153,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11219/500000]
+ train/ActionNoiseL2Loss=0.0128
+ throughput/total_tokens=2,154,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11220/500000]
+ optim/total_grad_norm=1.306
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=2,154,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11221/500000]
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=2,154,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11222/500000]
+ train/ActionNoiseL2Loss=0.0122
+ throughput/total_tokens=2,154,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11223/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=2,154,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11224/500000]
+ train/ActionNoiseL2Loss=0.0127
+ throughput/total_tokens=2,155,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11225/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=2,155,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11226/500000]
+ train/ActionNoiseL2Loss=0.0138
+ throughput/total_tokens=2,155,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11227/500000]
+ train/ActionNoiseL2Loss=0.0125
+ throughput/total_tokens=2,155,584,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11228/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=2,155,776,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11229/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=2,155,968,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11230/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=2,156,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11231/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=2,156,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11232/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=2,156,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11233/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=2,156,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11234/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=2,156,928,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11235/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=2,157,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11236/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=2,157,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11237/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=2,157,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11238/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=2,157,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11239/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=2,157,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11240/500000]
+ optim/total_grad_norm=0.9237
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=2,158,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11241/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=2,158,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11242/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=2,158,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11243/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=2,158,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11244/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=2,158,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11245/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=2,159,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11246/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=2,159,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11247/500000]
+ train/ActionNoiseL2Loss=0.0120
+ throughput/total_tokens=2,159,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11248/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=2,159,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11249/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=2,159,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11250/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=2,160,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11251/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=2,160,192,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11252/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=2,160,384,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11253/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=2,160,576,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11254/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=2,160,768,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11255/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=2,160,960,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11256/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,161,152,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11257/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=2,161,344,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11258/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=2,161,536,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11259/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=2,161,728,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11260/500000]
+ optim/total_grad_norm=0.9656
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=2,161,920,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11261/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=2,162,112,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11262/500000]
+ train/ActionNoiseL2Loss=0.0131
+ throughput/total_tokens=2,162,304,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11263/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=2,162,496,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11264/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=2,162,688,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11265/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=2,162,880,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11266/500000]
+ train/ActionNoiseL2Loss=0.0131
+ throughput/total_tokens=2,163,072,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11267/500000]
+ train/ActionNoiseL2Loss=0.0116
+ throughput/total_tokens=2,163,264,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11268/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=2,163,456,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11269/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=2,163,648,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11270/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=2,163,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11271/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=2,164,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11272/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=2,164,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11273/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=2,164,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11274/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=2,164,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11275/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=2,164,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11276/500000]
+ train/ActionNoiseL2Loss=0.0142
+ throughput/total_tokens=2,164,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11277/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=2,165,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11278/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=2,165,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11279/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=2,165,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11280/500000]
+ optim/total_grad_norm=0.8713
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=2,165,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11281/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=2,165,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11282/500000]
+ train/ActionNoiseL2Loss=0.0115
+ throughput/total_tokens=2,166,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11283/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=2,166,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11284/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=2,166,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11285/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=2,166,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11286/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=2,166,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11287/500000]
+ train/ActionNoiseL2Loss=0.0100
+ throughput/total_tokens=2,167,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11288/500000]
+ train/ActionNoiseL2Loss=0.0102
+ throughput/total_tokens=2,167,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11289/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=2,167,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11290/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=2,167,680,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11291/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=2,167,872,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11292/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=2,168,064,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11293/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=2,168,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11294/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=2,168,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11295/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=2,168,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11296/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=2,168,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11297/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=2,169,024,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11298/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=2,169,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11299/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=2,169,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11300/500000]
+ optim/total_grad_norm=0.7584
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=2,169,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11301/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=2,169,792,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11302/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=2,169,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11303/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=2,170,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11304/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=2,170,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11305/500000]
+ train/ActionNoiseL2Loss=0.0104
+ throughput/total_tokens=2,170,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11306/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=2,170,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11307/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=2,170,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11308/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=2,171,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11309/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=2,171,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11310/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=2,171,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11311/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=2,171,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11312/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=2,171,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11313/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=2,172,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11314/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,172,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11315/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=2,172,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11316/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=2,172,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11317/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=2,172,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11318/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=2,173,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11319/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,173,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11320/500000]
+ optim/total_grad_norm=1.045
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=2,173,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11321/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=2,173,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11322/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=2,173,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11323/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=2,174,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11324/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=2,174,208,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11325/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=2,174,400,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11326/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=2,174,592,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11327/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=2,174,784,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11328/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=2,174,976,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11329/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=2,175,168,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11330/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=2,175,360,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11331/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=2,175,552,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11332/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=2,175,744,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11333/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=2,175,936,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11334/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=2,176,128,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11335/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=2,176,320,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11336/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=2,176,512,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11337/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=2,176,704,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11338/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=2,176,896,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11339/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=2,177,088,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11340/500000]
+ optim/total_grad_norm=0.7125
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=2,177,280,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=11341/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=2,177,472,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11342/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=2,177,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11343/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=2,177,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11344/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=2,178,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11345/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=2,178,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11346/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=2,178,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11347/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=2,178,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11348/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=2,178,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11349/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,179,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11350/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,179,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11351/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=2,179,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11352/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=2,179,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11353/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=2,179,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11354/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=2,179,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11355/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=2,180,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11356/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=2,180,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11357/500000]
+ train/ActionNoiseL2Loss=0.0109
+ throughput/total_tokens=2,180,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11358/500000]
+ train/ActionNoiseL2Loss=0.0084
+ throughput/total_tokens=2,180,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11359/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,180,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11360/500000]
+ optim/total_grad_norm=1.462
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=2,181,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11361/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=2,181,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11362/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=2,181,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11363/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=2,181,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11364/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=2,181,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11365/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=2,182,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11366/500000]
+ train/ActionNoiseL2Loss=0.0130
+ throughput/total_tokens=2,182,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11367/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=2,182,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11368/500000]
+ train/ActionNoiseL2Loss=0.0151
+ throughput/total_tokens=2,182,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11369/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=2,182,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11370/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=2,183,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11371/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=2,183,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11372/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=2,183,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11373/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=2,183,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11374/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,183,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11375/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=2,184,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11376/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=2,184,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11377/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=2,184,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11378/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=2,184,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11379/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=2,184,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11380/500000]
+ optim/total_grad_norm=1.051
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=2,184,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11381/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=2,185,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11382/500000]
+ train/ActionNoiseL2Loss=0.0226
+ throughput/total_tokens=2,185,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11383/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=2,185,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11384/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=2,185,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11385/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,185,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11386/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=2,186,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11387/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=2,186,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11388/500000]
+ train/ActionNoiseL2Loss=0.0113
+ throughput/total_tokens=2,186,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11389/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=2,186,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11390/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=2,186,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11391/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=2,187,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11392/500000]
+ train/ActionNoiseL2Loss=0.0124
+ throughput/total_tokens=2,187,264,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11393/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,187,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11394/500000]
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=2,187,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11395/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=2,187,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11396/500000]
+ train/ActionNoiseL2Loss=0.0180
+ throughput/total_tokens=2,188,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11397/500000]
+ train/ActionNoiseL2Loss=0.0130
+ throughput/total_tokens=2,188,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11398/500000]
+ train/ActionNoiseL2Loss=0.0124
+ throughput/total_tokens=2,188,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11399/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=2,188,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11400/500000]
+ optim/total_grad_norm=0.7479
+ train/ActionNoiseL2Loss=0.0150
+ throughput/total_tokens=2,188,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11401/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=2,188,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11402/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=2,189,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11403/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=2,189,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11404/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=2,189,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11405/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=2,189,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11406/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=2,189,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11407/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=2,190,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11408/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=2,190,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11409/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=2,190,528,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11410/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=2,190,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11411/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=2,190,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11412/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=2,191,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11413/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=2,191,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11414/500000]
+ train/ActionNoiseL2Loss=0.0098
+ throughput/total_tokens=2,191,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11415/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=2,191,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11416/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=2,191,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11417/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=2,192,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11418/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=2,192,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11419/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=2,192,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11420/500000]
+ optim/total_grad_norm=1.328
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=2,192,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11421/500000]
+ train/ActionNoiseL2Loss=0.0126
+ throughput/total_tokens=2,192,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11422/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=2,193,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11423/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=2,193,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11424/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=2,193,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11425/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=2,193,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11426/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=2,193,792,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11427/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=2,193,984,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11428/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=2,194,176,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11429/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=2,194,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11430/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=2,194,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11431/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=2,194,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11432/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=2,194,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11433/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=2,195,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11434/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=2,195,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11435/500000]
+ train/ActionNoiseL2Loss=0.0147
+ throughput/total_tokens=2,195,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11436/500000]
+ train/ActionNoiseL2Loss=0.0090
+ throughput/total_tokens=2,195,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11437/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=2,195,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11438/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=2,196,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11439/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=2,196,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11440/500000]
+ optim/total_grad_norm=0.7146
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=2,196,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11441/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=2,196,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11442/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=2,196,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11443/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=2,197,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11444/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=2,197,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11445/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=2,197,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11446/500000]
+ train/ActionNoiseL2Loss=0.0099
+ throughput/total_tokens=2,197,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11447/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=2,197,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11448/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=2,198,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11449/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=2,198,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11450/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=2,198,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11451/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,198,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11452/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=2,198,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11453/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=2,198,976,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11454/500000]
+ train/ActionNoiseL2Loss=0.0116
+ throughput/total_tokens=2,199,168,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11455/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=2,199,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11456/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=2,199,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11457/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=2,199,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11458/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=2,199,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11459/500000]
+ train/ActionNoiseL2Loss=0.0137
+ throughput/total_tokens=2,200,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11460/500000]
+ optim/total_grad_norm=0.9508
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=2,200,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11461/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=2,200,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11462/500000]
+ train/ActionNoiseL2Loss=0.0100
+ throughput/total_tokens=2,200,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11463/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=2,200,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11464/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=2,201,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11465/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=2,201,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11466/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=2,201,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11467/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=2,201,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11468/500000]
+ train/ActionNoiseL2Loss=0.0144
+ throughput/total_tokens=2,201,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11469/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=2,202,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11470/500000]
+ train/ActionNoiseL2Loss=0.0123
+ throughput/total_tokens=2,202,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11471/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=2,202,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11472/500000]
+ train/ActionNoiseL2Loss=0.0104
+ throughput/total_tokens=2,202,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11473/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=2,202,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11474/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=2,203,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11475/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=2,203,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11476/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=2,203,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11477/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,203,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11478/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=2,203,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11479/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=2,203,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11480/500000]
+ optim/total_grad_norm=0.9640
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=2,204,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11481/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=2,204,352,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11482/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=2,204,544,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11483/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=2,204,736,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11484/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=2,204,928,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11485/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=2,205,120,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11486/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=2,205,312,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11487/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=2,205,504,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11488/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=2,205,696,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11489/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=2,205,888,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11490/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=2,206,080,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11491/500000]
+ train/ActionNoiseL2Loss=0.0140
+ throughput/total_tokens=2,206,272,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11492/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=2,206,464,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11493/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=2,206,656,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11494/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=2,206,848,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11495/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=2,207,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11496/500000]
+ train/ActionNoiseL2Loss=0.0115
+ throughput/total_tokens=2,207,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11497/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=2,207,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11498/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=2,207,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11499/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=2,207,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11500/500000]
+ optim/total_grad_norm=0.9338
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=2,208,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+10/05 [12:49:20] INFO | >> Saving config... checkpoint.py:608
+10/05 [12:49:54] INFO | >> Saving model state... checkpoint.py:796
+10/05 [12:51:08] INFO | >> Saving optim state... checkpoint.py:811
+10/05 [12:52:41] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=11501/500000]
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=2,208,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11502/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=2,208,384,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=11503/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=2,208,576,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=11504/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=2,208,768,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=11505/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=2,208,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=11506/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=2,209,152,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=11507/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=2,209,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11508/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=2,209,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11509/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=2,209,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11510/500000]
+ train/ActionNoiseL2Loss=0.0166
+ throughput/total_tokens=2,209,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11511/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=2,210,112,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11512/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=2,210,304,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11513/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=2,210,496,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11514/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=2,210,688,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11515/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=2,210,880,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11516/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=2,211,072,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11517/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=2,211,264,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11518/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=2,211,456,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11519/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=2,211,648,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11520/500000]
+ optim/total_grad_norm=0.6644
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=2,211,840,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11521/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=2,212,032,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11522/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=2,212,224,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11523/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=2,212,416,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11524/500000]
+ train/ActionNoiseL2Loss=0.0136
+ throughput/total_tokens=2,212,608,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11525/500000]
+ train/ActionNoiseL2Loss=0.0138
+ throughput/total_tokens=2,212,800,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11526/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=2,212,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11527/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=2,213,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11528/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,213,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11529/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,213,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11530/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=2,213,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11531/500000]
+ train/ActionNoiseL2Loss=0.0109
+ throughput/total_tokens=2,213,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11532/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=2,214,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11533/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=2,214,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11534/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=2,214,528,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11535/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=2,214,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11536/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=2,214,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11537/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=2,215,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11538/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=2,215,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11539/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=2,215,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11540/500000]
+ optim/total_grad_norm=1.117
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=2,215,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11541/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=2,215,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11542/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=2,216,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11543/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=2,216,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11544/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=2,216,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11545/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=2,216,640,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11546/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=2,216,832,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11547/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=2,217,024,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11548/500000]
+ train/ActionNoiseL2Loss=0.0143
+ throughput/total_tokens=2,217,216,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11549/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=2,217,408,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11550/500000]
+ train/ActionNoiseL2Loss=0.0140
+ throughput/total_tokens=2,217,600,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11551/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=2,217,792,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11552/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=2,217,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11553/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=2,218,176,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11554/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=2,218,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11555/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=2,218,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11556/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=2,218,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11557/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=2,218,944,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11558/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=2,219,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11559/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=2,219,328,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11560/500000]
+ optim/total_grad_norm=0.9331
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=2,219,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=11561/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=2,219,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11562/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=2,219,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11563/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=2,220,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11564/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=2,220,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11565/500000]
+ train/ActionNoiseL2Loss=0.0132
+ throughput/total_tokens=2,220,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11566/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=2,220,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11567/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=2,220,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11568/500000]
+ train/ActionNoiseL2Loss=0.0140
+ throughput/total_tokens=2,221,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11569/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=2,221,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11570/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=2,221,440,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11571/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=2,221,632,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11572/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=2,221,824,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11573/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,222,016,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11574/500000]
+ train/ActionNoiseL2Loss=0.0130
+ throughput/total_tokens=2,222,208,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11575/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=2,222,400,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11576/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=2,222,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11577/500000]
+ train/ActionNoiseL2Loss=0.0175
+ throughput/total_tokens=2,222,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11578/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=2,222,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11579/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=2,223,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11580/500000]
+ optim/total_grad_norm=1.333
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,223,360,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11581/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=2,223,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11582/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=2,223,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11583/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=2,223,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11584/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=2,224,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11585/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=2,224,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11586/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=2,224,512,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11587/500000]
+ train/ActionNoiseL2Loss=0.0139
+ throughput/total_tokens=2,224,704,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11588/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=2,224,896,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11589/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=2,225,088,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11590/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=2,225,280,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11591/500000]
+ train/ActionNoiseL2Loss=0.0124
+ throughput/total_tokens=2,225,472,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11592/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=2,225,664,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11593/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=2,225,856,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11594/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=2,226,048,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11595/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=2,226,240,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11596/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=2,226,432,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11597/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=2,226,624,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11598/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=2,226,816,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11599/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=2,227,008,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11600/500000]
+ optim/total_grad_norm=1.032
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=2,227,200,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11601/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=2,227,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11602/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=2,227,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11603/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=2,227,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11604/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=2,227,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11605/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=2,228,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11606/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=2,228,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11607/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=2,228,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11608/500000]
+ train/ActionNoiseL2Loss=0.0147
+ throughput/total_tokens=2,228,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11609/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=2,228,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11610/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=2,229,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11611/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=2,229,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11612/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=2,229,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11613/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,229,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11614/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=2,229,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11615/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=2,230,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11616/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=2,230,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11617/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=2,230,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11618/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=2,230,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11619/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=2,230,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11620/500000]
+ optim/total_grad_norm=0.9398
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=2,231,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11621/500000]
+ train/ActionNoiseL2Loss=0.0153
+ throughput/total_tokens=2,231,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11622/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=2,231,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11623/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=2,231,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11624/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,231,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11625/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=2,232,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11626/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=2,232,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11627/500000]
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,232,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11628/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=2,232,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11629/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=2,232,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11630/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=2,232,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11631/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=2,233,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11632/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=2,233,344,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11633/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=2,233,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11634/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=2,233,728,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11635/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=2,233,920,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11636/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=2,234,112,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11637/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=2,234,304,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11638/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=2,234,496,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11639/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,234,688,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11640/500000]
+ optim/total_grad_norm=1.663
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=2,234,880,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11641/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=2,235,072,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11642/500000]
+ train/ActionNoiseL2Loss=0.0115
+ throughput/total_tokens=2,235,264,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11643/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=2,235,456,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11644/500000]
+ train/ActionNoiseL2Loss=0.0131
+ throughput/total_tokens=2,235,648,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11645/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=2,235,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11646/500000]
+ train/ActionNoiseL2Loss=0.0191
+ throughput/total_tokens=2,236,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11647/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,236,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11648/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=2,236,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11649/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=2,236,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11650/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,236,800,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11651/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,236,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11652/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=2,237,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11653/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=2,237,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11654/500000]
+ train/ActionNoiseL2Loss=0.0131
+ throughput/total_tokens=2,237,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11655/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=2,237,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11656/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=2,237,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11657/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=2,238,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11658/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=2,238,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11659/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=2,238,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11660/500000]
+ optim/total_grad_norm=1.428
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=2,238,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=11661/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=2,238,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11662/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=2,239,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11663/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=2,239,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11664/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=2,239,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11665/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=2,239,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11666/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=2,239,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11667/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,240,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11668/500000]
+ train/ActionNoiseL2Loss=0.0128
+ throughput/total_tokens=2,240,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11669/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=2,240,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11670/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=2,240,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11671/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=2,240,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11672/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=2,241,024,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11673/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=2,241,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11674/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=2,241,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11675/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=2,241,600,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11676/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=2,241,792,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11677/500000]
+ train/ActionNoiseL2Loss=0.0131
+ throughput/total_tokens=2,241,984,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11678/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,242,176,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11679/500000]
+ train/ActionNoiseL2Loss=0.0149
+ throughput/total_tokens=2,242,368,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11680/500000]
+ optim/total_grad_norm=0.8076
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=2,242,560,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11681/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=2,242,752,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11682/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=2,242,944,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11683/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=2,243,136,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11684/500000]
+ train/ActionNoiseL2Loss=0.0119
+ throughput/total_tokens=2,243,328,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11685/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=2,243,520,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11686/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=2,243,712,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11687/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=2,243,904,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11688/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=2,244,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11689/500000]
+ train/ActionNoiseL2Loss=0.0195
+ throughput/total_tokens=2,244,288,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11690/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=2,244,480,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11691/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=2,244,672,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11692/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=2,244,864,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11693/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=2,245,056,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11694/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=2,245,248,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11695/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=2,245,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11696/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=2,245,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11697/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=2,245,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11698/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=2,246,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11699/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=2,246,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11700/500000]
+ optim/total_grad_norm=1.135
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=2,246,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11701/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=2,246,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11702/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=2,246,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11703/500000]
+ train/ActionNoiseL2Loss=0.0163
+ throughput/total_tokens=2,246,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11704/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=2,247,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11705/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=2,247,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11706/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=2,247,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11707/500000]
+ train/ActionNoiseL2Loss=0.0132
+ throughput/total_tokens=2,247,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11708/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,247,936,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11709/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=2,248,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11710/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=2,248,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,467
+[step=11711/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=2,248,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11712/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=2,248,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11713/500000]
+ train/ActionNoiseL2Loss=0.0162
+ throughput/total_tokens=2,248,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11714/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=2,249,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11715/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=2,249,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11716/500000]
+ train/ActionNoiseL2Loss=0.0083
+ throughput/total_tokens=2,249,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11717/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=2,249,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11718/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=2,249,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11719/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=2,250,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11720/500000]
+ optim/total_grad_norm=0.6764
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=2,250,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11721/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=2,250,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11722/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=2,250,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11723/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=2,250,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11724/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=2,251,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11725/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,251,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11726/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=2,251,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11727/500000]
+ train/ActionNoiseL2Loss=0.0141
+ throughput/total_tokens=2,251,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11728/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=2,251,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11729/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=2,251,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11730/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=2,252,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11731/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=2,252,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11732/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=2,252,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11733/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=2,252,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11734/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=2,252,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11735/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=2,253,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11736/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=2,253,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11737/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=2,253,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11738/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,253,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11739/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=2,253,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11740/500000]
+ optim/total_grad_norm=1.220
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=2,254,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11741/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=2,254,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11742/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=2,254,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11743/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=2,254,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11744/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=2,254,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11745/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=2,255,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11746/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=2,255,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11747/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=2,255,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11748/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=2,255,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11749/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=2,255,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11750/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=2,256,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11751/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=2,256,192,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11752/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=2,256,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11753/500000]
+ train/ActionNoiseL2Loss=0.0213
+ throughput/total_tokens=2,256,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11754/500000]
+ train/ActionNoiseL2Loss=0.0087
+ throughput/total_tokens=2,256,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11755/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=2,256,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11756/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=2,257,152,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11757/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=2,257,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11758/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=2,257,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11759/500000]
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=2,257,728,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11760/500000]
+ optim/total_grad_norm=0.7258
+ train/ActionNoiseL2Loss=0.0115
+ throughput/total_tokens=2,257,920,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11761/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=2,258,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11762/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=2,258,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11763/500000]
+ train/ActionNoiseL2Loss=0.0106
+ throughput/total_tokens=2,258,496,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11764/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=2,258,688,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11765/500000]
+ train/ActionNoiseL2Loss=0.0104
+ throughput/total_tokens=2,258,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11766/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=2,259,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11767/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=2,259,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11768/500000]
+ train/ActionNoiseL2Loss=0.0161
+ throughput/total_tokens=2,259,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11769/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=2,259,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11770/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=2,259,840,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11771/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=2,260,032,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11772/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=2,260,224,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11773/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=2,260,416,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11774/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=2,260,608,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11775/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=2,260,800,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11776/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=2,260,992,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11777/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=2,261,184,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11778/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=2,261,376,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11779/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=2,261,568,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11780/500000]
+ optim/total_grad_norm=1.041
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=2,261,760,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11781/500000]
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=2,261,952,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11782/500000]
+ train/ActionNoiseL2Loss=0.0107
+ throughput/total_tokens=2,262,144,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11783/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=2,262,336,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=11784/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=2,262,528,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11785/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=2,262,720,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11786/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=2,262,912,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11787/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=2,263,104,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11788/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=2,263,296,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11789/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=2,263,488,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11790/500000]
+ train/ActionNoiseL2Loss=0.1310
+ throughput/total_tokens=2,263,680,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11791/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=2,263,872,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11792/500000]
+ train/ActionNoiseL2Loss=0.0198
+ throughput/total_tokens=2,264,064,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11793/500000]
+ train/ActionNoiseL2Loss=0.0132
+ throughput/total_tokens=2,264,256,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11794/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=2,264,448,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11795/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=2,264,640,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11796/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=2,264,832,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11797/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,265,024,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11798/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=2,265,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11799/500000]
+ train/ActionNoiseL2Loss=0.0159
+ throughput/total_tokens=2,265,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11800/500000]
+ optim/total_grad_norm=1.362
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=2,265,600,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11801/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=2,265,792,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11802/500000]
+ train/ActionNoiseL2Loss=0.0190
+ throughput/total_tokens=2,265,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11803/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=2,266,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11804/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=2,266,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11805/500000]
+ train/ActionNoiseL2Loss=0.0118
+ throughput/total_tokens=2,266,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11806/500000]
+ train/ActionNoiseL2Loss=0.0148
+ throughput/total_tokens=2,266,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11807/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=2,266,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11808/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=2,267,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11809/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=2,267,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11810/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=2,267,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11811/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=2,267,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11812/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=2,267,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11813/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=2,268,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11814/500000]
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=2,268,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11815/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=2,268,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11816/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=2,268,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11817/500000]
+ train/ActionNoiseL2Loss=0.0204
+ throughput/total_tokens=2,268,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11818/500000]
+ train/ActionNoiseL2Loss=0.0152
+ throughput/total_tokens=2,269,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11819/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=2,269,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11820/500000]
+ optim/total_grad_norm=0.7745
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=2,269,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11821/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=2,269,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11822/500000]
+ train/ActionNoiseL2Loss=0.0168
+ throughput/total_tokens=2,269,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11823/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=2,270,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11824/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=2,270,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11825/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=2,270,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11826/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=2,270,592,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11827/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=2,270,784,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11828/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=2,270,976,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11829/500000]
+ train/ActionNoiseL2Loss=0.0215
+ throughput/total_tokens=2,271,168,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11830/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=2,271,360,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11831/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=2,271,552,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11832/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=2,271,744,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11833/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=2,271,936,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11834/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=2,272,128,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11835/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=2,272,320,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11836/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=2,272,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11837/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=2,272,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11838/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=2,272,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11839/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=2,273,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11840/500000]
+ optim/total_grad_norm=1.477
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=2,273,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11841/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=2,273,472,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11842/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=2,273,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11843/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=2,273,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11844/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=2,274,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11845/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=2,274,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11846/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=2,274,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11847/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=2,274,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11848/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=2,274,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11849/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=2,275,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11850/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=2,275,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11851/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=2,275,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11852/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=2,275,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11853/500000]
+ train/ActionNoiseL2Loss=0.0117
+ throughput/total_tokens=2,275,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11854/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,275,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11855/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=2,276,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11856/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=2,276,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11857/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=2,276,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11858/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=2,276,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11859/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=2,276,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11860/500000]
+ optim/total_grad_norm=1.040
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=2,277,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11861/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=2,277,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11862/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=2,277,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11863/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=2,277,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11864/500000]
+ train/ActionNoiseL2Loss=0.1535
+ throughput/total_tokens=2,277,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11865/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=2,278,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11866/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=2,278,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11867/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,278,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11868/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=2,278,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11869/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=2,278,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11870/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=2,279,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11871/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=2,279,232,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11872/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=2,279,424,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11873/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=2,279,616,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11874/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=2,279,808,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11875/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=2,280,000,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11876/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=2,280,192,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11877/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=2,280,384,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11878/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=2,280,576,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11879/500000]
+ train/ActionNoiseL2Loss=0.0130
+ throughput/total_tokens=2,280,768,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11880/500000]
+ optim/total_grad_norm=0.9308
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=2,280,960,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11881/500000]
+ train/ActionNoiseL2Loss=0.0146
+ throughput/total_tokens=2,281,152,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11882/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=2,281,344,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11883/500000]
+ train/ActionNoiseL2Loss=0.0205
+ throughput/total_tokens=2,281,536,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11884/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=2,281,728,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11885/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=2,281,920,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11886/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=2,282,112,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11887/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=2,282,304,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11888/500000]
+ train/ActionNoiseL2Loss=0.0125
+ throughput/total_tokens=2,282,496,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11889/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=2,282,688,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11890/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=2,282,880,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11891/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=2,283,072,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11892/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=2,283,264,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11893/500000]
+ train/ActionNoiseL2Loss=0.1114
+ throughput/total_tokens=2,283,456,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11894/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=2,283,648,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11895/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=2,283,840,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11896/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=2,284,032,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11897/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=2,284,224,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11898/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=2,284,416,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11899/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=2,284,608,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11900/500000]
+ optim/total_grad_norm=0.9174
+ train/ActionNoiseL2Loss=0.0236
+ throughput/total_tokens=2,284,800,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11901/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=2,284,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11902/500000]
+ train/ActionNoiseL2Loss=0.0181
+ throughput/total_tokens=2,285,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11903/500000]
+ train/ActionNoiseL2Loss=0.0140
+ throughput/total_tokens=2,285,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11904/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=2,285,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11905/500000]
+ train/ActionNoiseL2Loss=0.0112
+ throughput/total_tokens=2,285,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11906/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=2,285,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11907/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=2,286,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11908/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=2,286,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11909/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=2,286,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11910/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=2,286,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11911/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=2,286,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11912/500000]
+ train/ActionNoiseL2Loss=0.0137
+ throughput/total_tokens=2,287,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11913/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=2,287,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11914/500000]
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=2,287,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11915/500000]
+ train/ActionNoiseL2Loss=0.0196
+ throughput/total_tokens=2,287,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11916/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=2,287,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11917/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=2,288,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11918/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=2,288,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11919/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,288,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11920/500000]
+ optim/total_grad_norm=0.8476
+ train/ActionNoiseL2Loss=0.0109
+ throughput/total_tokens=2,288,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11921/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=2,288,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11922/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=2,289,024,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11923/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=2,289,216,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11924/500000]
+ train/ActionNoiseL2Loss=0.0138
+ throughput/total_tokens=2,289,408,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11925/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=2,289,600,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11926/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=2,289,792,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11927/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=2,289,984,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11928/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=2,290,176,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=11929/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=2,290,368,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11930/500000]
+ train/ActionNoiseL2Loss=0.0160
+ throughput/total_tokens=2,290,560,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11931/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=2,290,752,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11932/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,290,944,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11933/500000]
+ train/ActionNoiseL2Loss=0.0171
+ throughput/total_tokens=2,291,136,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11934/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=2,291,328,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11935/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=2,291,520,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11936/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=2,291,712,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11937/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=2,291,904,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11938/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=2,292,096,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11939/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=2,292,288,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11940/500000]
+ optim/total_grad_norm=0.6581
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=2,292,480,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11941/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=2,292,672,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11942/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=2,292,864,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11943/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=2,293,056,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11944/500000]
+ train/ActionNoiseL2Loss=0.0214
+ throughput/total_tokens=2,293,248,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11945/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=2,293,440,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11946/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=2,293,632,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11947/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,293,824,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11948/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,294,016,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11949/500000]
+ train/ActionNoiseL2Loss=0.0115
+ throughput/total_tokens=2,294,208,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11950/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=2,294,400,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11951/500000]
+ train/ActionNoiseL2Loss=0.0140
+ throughput/total_tokens=2,294,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11952/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=2,294,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11953/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=2,294,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11954/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=2,295,168,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11955/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,295,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11956/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=2,295,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11957/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=2,295,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11958/500000]
+ train/ActionNoiseL2Loss=0.0104
+ throughput/total_tokens=2,295,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11959/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,296,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11960/500000]
+ optim/total_grad_norm=1.200
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=2,296,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=11961/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=2,296,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11962/500000]
+ train/ActionNoiseL2Loss=0.0094
+ throughput/total_tokens=2,296,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11963/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=2,296,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11964/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=2,297,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11965/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=2,297,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11966/500000]
+ train/ActionNoiseL2Loss=0.0194
+ throughput/total_tokens=2,297,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11967/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=2,297,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11968/500000]
+ train/ActionNoiseL2Loss=0.0170
+ throughput/total_tokens=2,297,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11969/500000]
+ train/ActionNoiseL2Loss=0.0116
+ throughput/total_tokens=2,298,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11970/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=2,298,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11971/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=2,298,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11972/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=2,298,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11973/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=2,298,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11974/500000]
+ train/ActionNoiseL2Loss=0.0113
+ throughput/total_tokens=2,299,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11975/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=2,299,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11976/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=2,299,392,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11977/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=2,299,584,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11978/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=2,299,776,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11979/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,299,968,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11980/500000]
+ optim/total_grad_norm=1.259
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=2,300,160,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11981/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=2,300,352,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11982/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=2,300,544,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11983/500000]
+ train/ActionNoiseL2Loss=0.0212
+ throughput/total_tokens=2,300,736,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11984/500000]
+ train/ActionNoiseL2Loss=0.0113
+ throughput/total_tokens=2,300,928,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11985/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=2,301,120,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11986/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=2,301,312,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11987/500000]
+ train/ActionNoiseL2Loss=0.0112
+ throughput/total_tokens=2,301,504,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11988/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=2,301,696,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11989/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=2,301,888,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11990/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=2,302,080,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=11991/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=2,302,272,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11992/500000]
+ train/ActionNoiseL2Loss=0.0132
+ throughput/total_tokens=2,302,464,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11993/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=2,302,656,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11994/500000]
+ train/ActionNoiseL2Loss=0.0124
+ throughput/total_tokens=2,302,848,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11995/500000]
+ train/ActionNoiseL2Loss=0.0192
+ throughput/total_tokens=2,303,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11996/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=2,303,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11997/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=2,303,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11998/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=2,303,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=11999/500000]
+ train/ActionNoiseL2Loss=0.0135
+ throughput/total_tokens=2,303,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12000/500000]
+ optim/total_grad_norm=0.9185
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=2,304,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+10/05 [15:47:38] INFO | >> Saving config... checkpoint.py:608
+10/05 [15:48:13] INFO | >> Saving model state... checkpoint.py:796
+10/05 [15:49:23] INFO | >> Saving optim state... checkpoint.py:811
+10/05 [15:50:50] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=12001/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=2,304,192,000
+ throughput/device/tokens_per_second=1,191
+ throughput/device/batches_per_second=0.0496
+[step=12002/500000]
+ train/ActionNoiseL2Loss=0.0167
+ throughput/total_tokens=2,304,384,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=12003/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,304,576,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=12004/500000]
+ train/ActionNoiseL2Loss=0.0164
+ throughput/total_tokens=2,304,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=12005/500000]
+ train/ActionNoiseL2Loss=0.0173
+ throughput/total_tokens=2,304,960,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=12006/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=2,305,152,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0483
+[step=12007/500000]
+ train/ActionNoiseL2Loss=0.0142
+ throughput/total_tokens=2,305,344,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12008/500000]
+ train/ActionNoiseL2Loss=0.0176
+ throughput/total_tokens=2,305,536,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12009/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=2,305,728,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12010/500000]
+ train/ActionNoiseL2Loss=0.0183
+ throughput/total_tokens=2,305,920,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+ System/Peak GPU Memory (MB)=46,467
+[step=12011/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=2,306,112,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=12012/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=2,306,304,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=12013/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=2,306,496,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=12014/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=2,306,688,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=12015/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,306,880,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=12016/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=2,307,072,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=12017/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=2,307,264,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=12018/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=2,307,456,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=12019/500000]
+ train/ActionNoiseL2Loss=0.0154
+ throughput/total_tokens=2,307,648,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=12020/500000]
+ optim/total_grad_norm=1.746
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=2,307,840,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=12021/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=2,308,032,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12022/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=2,308,224,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12023/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=2,308,416,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12024/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=2,308,608,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12025/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=2,308,800,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12026/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=2,308,992,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12027/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=2,309,184,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12028/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=2,309,376,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12029/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=2,309,568,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12030/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=2,309,760,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=12031/500000]
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=2,309,952,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12032/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=2,310,144,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12033/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=2,310,336,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12034/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=2,310,528,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12035/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=2,310,720,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12036/500000]
+ train/ActionNoiseL2Loss=0.0200
+ throughput/total_tokens=2,310,912,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12037/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=2,311,104,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12038/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=2,311,296,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12039/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=2,311,488,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12040/500000]
+ optim/total_grad_norm=0.8163
+ train/ActionNoiseL2Loss=0.0120
+ throughput/total_tokens=2,311,680,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=12041/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=2,311,872,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12042/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=2,312,064,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12043/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=2,312,256,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12044/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=2,312,448,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12045/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=2,312,640,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12046/500000]
+ train/ActionNoiseL2Loss=0.0098
+ throughput/total_tokens=2,312,832,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12047/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=2,313,024,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12048/500000]
+ train/ActionNoiseL2Loss=0.0174
+ throughput/total_tokens=2,313,216,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12049/500000]
+ train/ActionNoiseL2Loss=0.0143
+ throughput/total_tokens=2,313,408,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12050/500000]
+ train/ActionNoiseL2Loss=0.0118
+ throughput/total_tokens=2,313,600,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=12051/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=2,313,792,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12052/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=2,313,984,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12053/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=2,314,176,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12054/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=2,314,368,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12055/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=2,314,560,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12056/500000]
+ train/ActionNoiseL2Loss=0.0189
+ throughput/total_tokens=2,314,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12057/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=2,314,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12058/500000]
+ train/ActionNoiseL2Loss=0.0130
+ throughput/total_tokens=2,315,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12059/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=2,315,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12060/500000]
+ optim/total_grad_norm=0.7221
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=2,315,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=12061/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=2,315,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12062/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=2,315,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12063/500000]
+ train/ActionNoiseL2Loss=0.0169
+ throughput/total_tokens=2,316,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12064/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=2,316,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=12065/500000]
+ train/ActionNoiseL2Loss=0.0156
+ throughput/total_tokens=2,316,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=12066/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=2,316,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=12067/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=2,316,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=12068/500000]
+ train/ActionNoiseL2Loss=0.0145
+ throughput/total_tokens=2,317,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=12069/500000]
+ train/ActionNoiseL2Loss=0.0107
+ throughput/total_tokens=2,317,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=12070/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=2,317,440,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=12071/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=2,317,632,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=12072/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=2,317,824,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=12073/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=2,318,016,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=12074/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=2,318,208,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=12075/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=2,318,400,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=12076/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=2,318,592,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=12077/500000]
+ train/ActionNoiseL2Loss=0.0142
+ throughput/total_tokens=2,318,784,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=12078/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=2,318,976,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=12079/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=2,319,168,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=12080/500000]
+ optim/total_grad_norm=0.8219
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=2,319,360,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=12081/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=2,319,552,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=12082/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=2,319,744,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=12083/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=2,319,936,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=12084/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=2,320,128,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=12085/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=2,320,320,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=12086/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=2,320,512,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12087/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=2,320,704,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12088/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=2,320,896,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12089/500000]
+ train/ActionNoiseL2Loss=0.0178
+ throughput/total_tokens=2,321,088,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12090/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=2,321,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=12091/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=2,321,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12092/500000]
+ train/ActionNoiseL2Loss=0.0157
+ throughput/total_tokens=2,321,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12093/500000]
+ train/ActionNoiseL2Loss=0.0138
+ throughput/total_tokens=2,321,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12094/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=2,322,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12095/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,322,240,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12096/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=2,322,432,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12097/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=2,322,624,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12098/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,322,816,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12099/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=2,323,008,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12100/500000]
+ optim/total_grad_norm=1.916
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=2,323,200,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=12101/500000]
+ train/ActionNoiseL2Loss=0.0219
+ throughput/total_tokens=2,323,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12102/500000]
+ train/ActionNoiseL2Loss=0.0231
+ throughput/total_tokens=2,323,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12103/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=2,323,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12104/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=2,323,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12105/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=2,324,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12106/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=2,324,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12107/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=2,324,544,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12108/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=2,324,736,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12109/500000]
+ train/ActionNoiseL2Loss=0.0179
+ throughput/total_tokens=2,324,928,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12110/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=2,325,120,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=46,467
+[step=12111/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=2,325,312,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12112/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=2,325,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12113/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=2,325,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12114/500000]
+ train/ActionNoiseL2Loss=0.0187
+ throughput/total_tokens=2,325,888,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12115/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=2,326,080,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12116/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=2,326,272,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12117/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=2,326,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12118/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=2,326,656,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12119/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=2,326,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=12120/500000]
+ optim/total_grad_norm=0.8645
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=2,327,040,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=12121/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=2,327,232,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12122/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=2,327,424,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12123/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=2,327,616,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12124/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=2,327,808,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12125/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=2,328,000,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12126/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=2,328,192,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12127/500000]
+ train/ActionNoiseL2Loss=0.0172
+ throughput/total_tokens=2,328,384,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12128/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=2,328,576,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12129/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=2,328,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=12130/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=2,328,960,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,467
+[step=12131/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=2,329,152,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
diff --git a/glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/files/requirements.txt b/glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/files/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..5a5e971a5d9f3b6f6a75248e203682c5fbcd69e8
--- /dev/null
+++ b/glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/files/requirements.txt
@@ -0,0 +1,286 @@
+ai2-molmo==0.0.0
+astunparse==1.6.3
+flatbuffers==25.2.10
+gast==0.6.0
+google-pasta==0.2.0
+h5py==3.14.0
+libclang==18.1.1
+Markdown==3.9
+namex==0.1.0
+opt_einsum==3.4.0
+optree==0.17.0
+tensorboard-data-server==0.7.2
+tensorflow-io-gcs-filesystem==0.37.1
+termcolor==3.1.0
+Werkzeug==3.1.3
+Brotli==1.1.0
+Farama-Notifications==0.0.4
+MarkupSafe==2.1.5
+PyYAML==6.0.2
+absl-py==2.3.1
+accelerate==1.10.1
+ai2-molmo==0.0.0
+aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.15
+aiosignal==1.4.0
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+anyio==4.10.0
+array_record==0.8.1
+async-timeout==5.0.1
+attrs==25.3.0
+av==15.1.0
+backports.tarfile==1.2.0
+beaker-gantry==3.2.0
+beaker-py==2.5.0
+black==23.12.1
+blinker==1.9.0
+boltons==25.0.0
+boto3==1.40.33
+botocore==1.40.33
+build==1.3.0
+cached_path==1.7.3
+cached-property==2.0.1
+cachetools==5.5.2
+certifi==2025.8.3
+cffi==2.0.0
+charset-normalizer==3.4.3
+click==8.2.1
+click-help-colors==0.9.4
+click-option-group==0.5.7
+cloudpickle==3.1.1
+cmake==4.1.0
+contourpy==1.3.2
+cryptography==46.0.1
+cycler==0.12.1
+dataclass-extensions==0.2.3
+datasets==3.6.0
+decorator==5.2.1
+deepdiff==8.6.1
+diffusers==0.35.1
+dill==0.3.8
+distro==1.9.0
+dlimp==0.0.1
+dm-tree==0.1.9
+docutils==0.22.1
+draccus==0.10.0
+editdistance==0.8.1
+einops==0.8.1
+einops-exts==0.0.4
+et_xmlfile==2.0.0
+etils==1.13.0
+evdev==1.9.2
+exceptiongroup==1.3.0
+face==24.0.0
+fastapi==0.116.2
+ffmpy==0.6.1
+fiddle==0.3.0
+filelock==3.13.1
+Flask==3.1.2
+fonttools==4.60.0
+frozenlist==1.7.0
+fsspec==2023.9.2
+ftfy==6.3.1
+gcsfs==2023.9.2
+gitdb==4.0.12
+GitPython==3.1.45
+glom==24.11.0
+google-api-core==2.25.1
+google-auth==2.40.3
+google-auth-oauthlib==1.2.2
+google-cloud-core==2.4.3
+google-cloud-storage==2.19.0
+google-crc32c==1.7.1
+google-resumable-media==2.7.2
+googleapis-common-protos==1.70.0
+gradio==5.46.0
+gradio_client==1.13.0
+graphviz==0.21
+groovy==0.1.2
+grpcio==1.75.0
+gymnasium==0.29.1
+h11==0.16.0
+hf_transfer==0.1.9
+hf-xet==1.1.10
+httpcore==1.0.9
+httpx==0.28.1
+huggingface-hub==0.35.0
+id==1.5.0
+idna==3.10
+imageio==2.37.0
+imageio-ffmpeg==0.6.0
+importlib_metadata==8.7.0
+importlib_resources==6.5.2
+iniconfig==2.1.0
+inquirerpy==0.3.4
+isort==5.12.0
+itsdangerous==2.2.0
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.3.0
+jeepney==0.9.0
+Jinja2==3.1.4
+jiter==0.11.0
+jmespath==1.0.1
+joblib==1.5.2
+jsonlines==4.0.0
+keras==2.15.0
+keyring==25.6.0
+kiwisolver==1.4.9
+latex2sympy2_extended==1.10.2
+lerobot==0.3.4
+Levenshtein==0.27.1
+libcst==1.8.4
+lightning-utilities==0.15.2
+markdown-it-py==4.0.0
+math-verify==0.8.0
+matplotlib==3.10.6
+mdurl==0.1.2
+mergedeep==1.3.4
+ml-dtypes==0.2.0
+ml_dtypes==0.5.3
+more-itertools==10.8.0
+mpmath==1.3.0
+msgspec==0.19.0
+multidict==6.6.4
+multiprocess==0.70.16
+mypy==1.3.0
+mypy_extensions==1.1.0
+necessary==0.4.3
+networkx==3.3
+nh3==0.3.0
+nltk==3.9.1
+numpy==1.26.4
+oauthlib==3.3.1
+omegaconf==2.3.0
+openai==1.108.0
+opencv-python-headless==4.12.0.88
+OpenEXR==3.4.0
+openpyxl==3.1.5
+orderly-set==5.5.0
+orjson==3.11.3
+packaging==25.0
+pandas==2.3.2
+pathspec==0.12.1
+petname==2.6
+pfzy==0.3.4
+pillow==11.0.0
+pip==25.2
+platformdirs==4.4.0
+pluggy==1.6.0
+promise==2.3
+prompt_toolkit==3.0.52
+propcache==0.3.2
+proto-plus==1.26.1
+protobuf==4.21.12
+protobuf==6.32.1
+psutil==7.1.0
+pyarrow==21.0.0
+pyasn1==0.6.1
+pyasn1_modules==0.4.2
+pycparser==2.23
+pydantic==2.11.9
+pydantic_core==2.33.2
+pydub==0.25.1
+Pygments==2.19.2
+pynput==1.8.1
+pyparsing==3.2.4
+pyproject_hooks==1.2.0
+pyserial==3.5
+pytest==8.4.2
+pytest-sphinx==0.6.3
+python-dateutil==2.9.0.post0
+python-Levenshtein==0.27.1
+python-multipart==0.0.20
+python-xlib==0.33
+pytorch-triton-rocm==3.4.0
+pytz==2025.2
+pyyaml-include==1.4.1
+RapidFuzz==3.14.1
+readme_renderer==44.0
+regex==2025.9.1
+requests==2.32.5
+requests-oauthlib==2.0.0
+requests-toolbelt==1.0.0
+requirements-parser==0.13.0
+rerun-sdk==0.22.1
+rfc3986==2.0.0
+rich==13.9.4
+rsa==4.9.1
+ruff==0.13.0
+s3transfer==0.14.0
+safehttpx==0.1.6
+safetensors==0.6.2
+scikit-learn==1.7.2
+scipy==1.15.3
+SecretStorage==3.4.0
+semantic-version==2.10.0
+sentencepiece==0.2.1
+sentry-sdk==2.38.0
+setuptools==78.1.1
+shellingham==1.5.4
+six==1.17.0
+smart_open==7.3.1
+smashed==0.21.5
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.48.0
+sympy==1.13.3
+tensorboard==2.15.2
+tensorboard==2.19.0
+tensorflow==2.15.0
+tensorflow-addons==0.23.0
+tensorflow-datasets==4.9.3
+tensorflow-estimator==2.15.0
+tensorflow-graphics==2021.12.3
+tensorflow-metadata==1.17.2
+threadpoolctl==3.6.0
+timm==1.0.19
+tokenizers==0.22.0
+toml==0.10.2
+tomli==2.2.1
+tomlkit==0.13.3
+torch==2.8.0+rocm6.4
+torchcodec==0.5
+torchmetrics==1.8.2
+torchvision==0.23.0+rocm6.4
+tqdm==4.67.1
+transformers==4.56.1
+trimesh==4.8.2
+trouting==0.3.3
+twine==6.2.0
+typeguard==2.13.3
+typer==0.17.4
+typing_extensions==4.15.0
+typing-inspect==0.9.0
+typing-inspection==0.4.1
+tzdata==2025.2
+urllib3==2.5.0
+uvicorn==0.35.0
+wandb==0.21.4
+wcwidth==0.2.13
+websockets==15.0.1
+wheel==0.45.1
+wrapt==1.14.2
+xxhash==3.5.0
+yarl==1.20.1
+zipp==3.23.0
+lerobot==0.3.4
+minLoRA==0.1.0
+autocommand==2.2.2
+backports.tarfile==1.2.0
+importlib_metadata==8.0.0
+inflect==7.3.1
+jaraco.collections==5.1.0
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+more-itertools==10.3.0
+packaging==24.2
+platformdirs==4.2.2
+tomli==2.0.1
+typeguard==4.3.0
+typing_extensions==4.12.2
+wheel==0.45.1
+zipp==3.19.2
diff --git a/glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/files/wandb-metadata.json b/glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/files/wandb-metadata.json
new file mode 100644
index 0000000000000000000000000000000000000000..76f41c76025b39d9b5566488840b71a26ba61c93
--- /dev/null
+++ b/glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/files/wandb-metadata.json
@@ -0,0 +1,204 @@
+{
+ "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35",
+ "python": "CPython 3.10.18",
+ "startedAt": "2025-10-02T16:37:28.959576Z",
+ "args": [
+ "qwen2_7b",
+ "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/glue_flow_matching",
+ "--vision_backbone",
+ "openai",
+ "--action_head",
+ "flow_matching",
+ "--seq_len",
+ "1600",
+ "--ft_llm",
+ "--checkpoint",
+ "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924",
+ "--device_train_microbatch_size",
+ "16",
+ "--global_batch_size",
+ "126",
+ "--dataset",
+ "vla_dataset_realworld",
+ "--llm_learning_rate",
+ "5e-5",
+ "--wandb_entity",
+ "henryeap",
+ "--wandb_project",
+ "a1-realworld",
+ "--wandb_run_name",
+ "glue",
+ "--real_world_vla_config_path",
+ "vla_config_realworld/vla_config_glue.yaml",
+ "--save_overwrite"
+ ],
+ "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py",
+ "codePath": "launch_scripts/train_vla.py",
+ "codePathLocal": "launch_scripts/train_vla.py",
+ "git": {
+ "remote": "https://github.com/Spatialtemporal-AI/A1.git",
+ "commit": "5071f59d87c6a976691323cbac66d7a988b0b4e7"
+ },
+ "email": "ihenrykwok@outlook.com",
+ "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/glue_flow_matching/wandb",
+ "host": "auh7-1b-gpu-260",
+ "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "Instinct MI210",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "470343073792",
+ "used": "56243757056"
+ }
+ },
+ "memory": {
+ "total": "2434606956544"
+ },
+ "gpu_amd": [
+ {
+ "id": "2",
+ "uniqueId": "0x9815965a899d8053",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "6",
+ "uniqueId": "0x2d75dae36f0dc353",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "7",
+ "uniqueId": "0x702e8efb76b00c21",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "5",
+ "uniqueId": "0xd79d4a081e34548d",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "1",
+ "uniqueId": "0xe35cdba2e3fafd21",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "3",
+ "uniqueId": "0xd7a6e11358a6574d",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "4",
+ "uniqueId": "0x4493708eee1ee737",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "0",
+ "uniqueId": "0x4213cc9eeeefc98d",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ }
+ ],
+ "slurm": {
+ "cluster_name": "ai-04r",
+ "conf": "/etc/slurm/slurm.conf",
+ "cpus_on_node": "128",
+ "gpus_on_node": "8",
+ "gtids": "0",
+ "job_account": "faculty-acc",
+ "job_cpus_per_node": "128",
+ "job_end_time": "1759682204",
+ "job_gid": "2000",
+ "job_gpus": "0,1,2,3,4,5,6,7",
+ "job_id": "2277",
+ "job_name": "mh_glue_flow_matching",
+ "job_nodelist": "auh7-1b-gpu-260",
+ "job_num_nodes": "1",
+ "job_partition": "faculty",
+ "job_qos": "xdqos",
+ "job_start_time": "1759423004",
+ "job_uid": "2013",
+ "job_user": "xiaodan",
+ "jobid": "2277",
+ "localid": "0",
+ "nnodes": "1",
+ "nodeid": "0",
+ "nodelist": "auh7-1b-gpu-260",
+ "nprocs": "1",
+ "ntasks": "1",
+ "ntasks_per_node": "1",
+ "oom_kill_step": "0",
+ "prio_process": "0",
+ "procid": "0",
+ "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts",
+ "submit_host": "auh-1b-cpu-login-001",
+ "task_pid": "2574600",
+ "tasks_per_node": "1",
+ "topology_addr": "auh7-1b-gpu-260",
+ "topology_addr_pattern": "node"
+ },
+ "writerId": "bkls6pwuvb5z6spobbikig7vp96dw2y9"
+}
\ No newline at end of file
diff --git a/glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/logs/debug-core.log b/glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/logs/debug-core.log
new file mode 100644
index 0000000000000000000000000000000000000000..2bff196e2fe2e6f5c67217603bdc9f341c8b9479
--- /dev/null
+++ b/glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/logs/debug-core.log
@@ -0,0 +1,12 @@
+{"time":"2025-10-02T16:37:29.014245666Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpusl77j3_/port-2574789.txt","pid":2574789,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
+{"time":"2025-10-02T16:37:29.016062848Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":2574789}
+{"time":"2025-10-02T16:37:29.016006867Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-2574789-2574955-4107859315/socket","Net":"unix"}}
+{"time":"2025-10-02T16:37:29.198285234Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
+{"time":"2025-10-02T16:37:29.205734663Z","level":"INFO","msg":"handleInformInit: received","streamId":"tmwli25x","id":"1(@)"}
+{"time":"2025-10-02T16:37:30.340260012Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"tmwli25x","id":"1(@)"}
+.txt","pid":3780083,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
+{"time":"2025-10-02T16:37:29.282444644Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":3780083}
+{"time":"2025-10-02T16:37:29.282434424Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-3780083-3780247-3093816148/socket","Net":"unix"}}
+{"time":"2025-10-02T16:37:29.458879988Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
+{"time":"2025-10-02T16:37:29.465619355Z","level":"INFO","msg":"handleInformInit: received","streamId":"7ovz4jzt","id":"1(@)"}
+{"time":"2025-10-02T16:37:30.493288413Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"7ovz4jzt","id":"1(@)"}
diff --git a/glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/logs/debug-internal.log b/glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/logs/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..b6f233979d8d54643d262152a9e875cadf5086d3
--- /dev/null
+++ b/glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/logs/debug-internal.log
@@ -0,0 +1,6 @@
+{"time":"2025-10-02T16:37:29.207693207Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-10-02T16:37:30.340213302Z","level":"INFO","msg":"stream: created new stream","id":"tmwli25x"}
+{"time":"2025-10-02T16:37:30.340254592Z","level":"INFO","msg":"stream: started","id":"tmwli25x"}
+{"time":"2025-10-02T16:37:30.340274553Z","level":"INFO","msg":"writer: started","stream_id":"tmwli25x"}
+{"time":"2025-10-02T16:37:30.340287593Z","level":"INFO","msg":"handler: started","stream_id":"tmwli25x"}
+{"time":"2025-10-02T16:37:30.340319673Z","level":"INFO","msg":"sender: started","stream_id":"tmwli25x"}
diff --git a/glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/logs/debug.log b/glue_flow_matching/wandb/wandb/run-20251002_163728-tmwli25x/logs/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/glue_l1_regression/step12000-unsharded/config.yaml b/glue_l1_regression/step12000-unsharded/config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..b5bf061fe266462b20a2186e4e0e3213b49ad5a3
--- /dev/null
+++ b/glue_l1_regression/step12000-unsharded/config.yaml
@@ -0,0 +1,322 @@
+run_name: glue_20251002_163658
+seed: 6198
+epoch: null
+dry_run: false
+model:
+ d_model: 3584
+ n_heads: 28
+ n_kv_heads: 4
+ qkv_bias: true
+ clip_qkv: null
+ n_layers: 28
+ mlp_ratio: 4
+ mlp_hidden_size: 37888
+ activation_type: swiglu
+ block_type: sequential
+ block_group_size: 1
+ rope: true
+ rope_full_precision: true
+ rope_theta: 1000000.0
+ vision_backbone:
+ image_model_type: openai
+ image_default_input_size:
+ - 336
+ - 336
+ image_patch_size: 14
+ image_pos_patch_size: 14
+ image_emb_dim: 1024
+ image_num_heads: 16
+ image_num_key_value_heads: 16
+ image_num_layers: 23
+ image_head_dim: 64
+ image_mlp_dim: 4096
+ image_mlp_activations: quick_gelu
+ image_dropout_rate: 0.0
+ image_num_pos: 577
+ image_norm_eps: 1.0e-05
+ attention_dropout: 0.0
+ residual_dropout: 0.0
+ initializer_range: 0.02
+ fsdp_wrap: false
+ resize_mode: default
+ vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt
+ llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt
+ low_cpu_fsdp: true
+ attention_type: sdpa
+ float32_attention: true
+ attention_dropout: 0.0
+ attention_layer_norm: false
+ residual_dropout: 0.1
+ response_residual_dropout: 0.0
+ embedding_dropout: 0.0
+ layer_norm_type: rms
+ layer_norm_with_affine: true
+ layer_norm_eps: 1.0e-06
+ attention_layer_norm_with_affine: true
+ max_sequence_length: 4096
+ max_position_embeddings: null
+ include_bias: false
+ bias_for_layer_norm: null
+ scale_logits: false
+ vocab_size: 152064
+ embedding_size: 152064
+ ff_out_size: null
+ additional_vocab_size: 128
+ new_embedding_init_range: 0.02
+ weight_tying: false
+ init_device: null
+ init_fn: normal
+ init_std: 0.02
+ init_cutoff_factor: null
+ norm_after: false
+ precision: amp_bf16
+ max_crops: 12
+ crop_mode: overlap-and-resize-c2
+ use_col_tokens: true
+ prompt_type: uber_model
+ system_prompt_kind: demo_or_style
+ message_formatting: role
+ always_start_with_space: true
+ multi_annotation_weighting: root_subsegments
+ default_inference_len: 65
+ overlap_margins:
+ - 4
+ - 4
+ pad_value: 0.0
+ image_padding_embed: pad_and_partial_pad
+ fix_image_padding: true
+ vit_layers:
+ - -2
+ - -9
+ image_pooling_h: 2
+ image_pooling_w: 2
+ image_pooling_2d: attention_meanq
+ image_projector: mlp
+ image_feature_dropout: 0.0
+ initializer_range: 0.02
+ normalize_input_embeds: false
+ use_position_ids: true
+ head_dim: null
+ action_tokenizer:
+ identifier: physical-intelligence/fast
+ tokenizer_dir: null
+ action_dim: 7
+ horizon: 8
+ tokenizer:
+ identifier: Qwen/Qwen2-7B
+ tokenizer_dir: null
+ pad_tokenizer: true
+ moe_num_experts: 8
+ moe_top_k: 2
+ moe_mlp_impl: sparse
+ moe_log_expert_assignment: false
+ moe_shared_expert: false
+ moe_lbl_in_fp32: false
+ moe_interleave: false
+ moe_loss_weight: 0.1
+ moe_zloss_weight: null
+ moe_dropless: true
+ moe_capacity_factor: 1.25
+ action_head: l1_regression
+ num_diffusion_steps: 1000
+ num_diffusion_inference_steps: 30
+ use_proprio: true
+ action_head_dit_hidden_size: 1152
+ action_head_dit_depth: 28
+ action_head_dit_num_heads: 16
+ llm_causal_attention: false
+ action_use_left_eef: true
+ action_use_mobile_base: false
+allow_resume: false
+ft_llm: true
+ft_vit: false
+ft_connector: false
+ft_embedding: lm_head
+lora: false
+use_lora: true
+lora_rank: 8
+lora_llm: false
+lora_vit: false
+lora_connector: false
+early_exit: false
+train_exit_random_layer: false
+optimizer:
+ name: adamw
+ learning_rate: 0.0001
+ weight_decay: 0.01
+ betas:
+ - 0.9
+ - 0.95
+ eps: 1.0e-05
+ connector_learning_rate: 0.0002
+ vit_learning_rate: 6.0e-06
+ llm_learning_rate: 5.0e-05
+ connector_weight_decay: 0.0
+ vit_weight_decay: 0.0
+ llm_weight_decay: 0.0
+ connector_betas:
+ - 0.9
+ - 0.95
+ vit_betas:
+ - 0.9
+ - 0.95
+ llm_betas:
+ - 0.9
+ - 0.95
+ connector_eps: 1.0e-06
+ vit_eps: 1.0e-06
+ llm_eps: 1.0e-06
+ metrics_log_interval: 20
+scheduler:
+ name: multimodal
+ units: steps
+ t_warmup: 100
+ t_max: null
+ alpha_f: 0.1
+ connector_t_warmup: 200
+ vit_t_warmup: 2000
+ llm_t_warmup: 2000
+ grad_clip_warmup_steps: null
+ grad_clip_warmup_factor: null
+ warmup_min_lr: 0.0
+data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: train
+ seed: 95818
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: true
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: false
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Glue
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 100000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: null
+ lerobot_episode_index_end: null
+restore_dataloader: true
+fast_forward_batches: null
+evaluators:
+- label: val
+ data:
+ dataset: vla_dataset_realworld
+ mixture: null
+ root_size_mixture: null
+ split: validation
+ seed: null
+ shuffle_messages: false
+ pad: to_max
+ sequence_length: 1600
+ shuffle: false
+ for_inference: false
+ multi_modal: torch
+ num_workers: 0
+ drop_last: true
+ pin_memory: true
+ prefetch_factor: null
+ persistent_workers: true
+ timeout: 0
+ rlds_dataset_name: libero_4_task_suites_no_noops
+ rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
+ use_wrist_image: true
+ use_proprio: true
+ rlds_shuffle_buffer_size: 256000
+ rlds_traj_threads: 8
+ rlds_read_threads: 8
+ lerobot_episode_index_start: 353
+ lerobot_episode_index_end: 765
+ device_eval_batch_size: null
+ subset_num_batches: 64
+ max_examples: null
+ max_new_tokens: 448
+ mm_evaluator: null
+ save_dir: null
+ save_to_checkpoint_dir: false
+ eval_name: null
+ skip_if_metrics_cached: true
+eval_interval: 0
+inf_eval_interval: -1
+inf_evaluators: []
+save_folder: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/glue_l1_regression
+remote_save_folder: null
+canceled_check_interval: 50
+save_interval: 500
+save_interval_unsharded: 500
+save_interval_ephemeral: null
+save_interval_action_head: 500
+save_num_checkpoints_to_keep: 1
+save_num_unsharded_checkpoints_to_keep: 1
+save_num_action_head_checkpoints_to_keep: 2
+save_overwrite: true
+force_save_unsharded: false
+no_pre_train_checkpoint: true
+initial_model_checkpoint: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_model_config: null
+checkpoint_dir: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924
+load_path: null
+load_path_sharded_checkpointer: null
+reset_optimizer_state: false
+reset_trainer_state: false
+save_dataloader_state: false
+reset_dataloader_state: false
+keep_lr_on_load: true
+sharded_checkpointer: torch_legacy
+max_duration: 500000
+global_train_batch_size: 126
+device_train_batch_size: 15
+device_train_microbatch_size: 16
+device_eval_batch_size: 4
+eval_subset_num_batches: -1
+eval_on_load: false
+device_inf_eval_batch_size: 16
+inf_eval_subset_num_batches: -1
+device_train_grad_accum: 0
+max_grad_norm: 1.0
+multi_component_grad_norm: true
+batch_divisor: global_batch
+max_grad_norm_ratio: null
+precision: amp_bf16
+wandb:
+ project: a1-realworld
+ entity: henryeap
+ group: null
+ name: glue_20251002_163658
+ tags:
+ - watching
+ log_artifacts: false
+ rank_zero_only: true
+ log_interval: 1
+speed_monitor:
+ window_size: 20
+ gpu_flops_available: null
+console_log_interval: 1
+gen1_gc_interval: 1
+compile: null
+fsdp:
+ use_orig_params: true
+ sharding_strategy: FULL_SHARD
+ wrapping_strategy: by_block_and_size
+ precision: float
+ hybrid_sharding_num_model_replicas: null
+softmax_auxiliary_loss: true
+softmax_auxiliary_loss_scale: 0.0001
+time_limit: null
+extra_steps_after_cancel: 10
+python_profiling: false
+torch_profiling: false
+stop_at: 500000
+stop_after: null
+activation_checkpointing: whole_layer
+fused_loss: null
diff --git a/glue_l1_regression/wandb/wandb/debug-internal.log b/glue_l1_regression/wandb/wandb/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..f58c1475f78e716f565c85beed1b416156e7b5e0
--- /dev/null
+++ b/glue_l1_regression/wandb/wandb/debug-internal.log
@@ -0,0 +1,6 @@
+{"time":"2025-10-02T16:37:29.467576263Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-10-02T16:37:30.493240032Z","level":"INFO","msg":"stream: created new stream","id":"7ovz4jzt"}
+{"time":"2025-10-02T16:37:30.493282902Z","level":"INFO","msg":"stream: started","id":"7ovz4jzt"}
+{"time":"2025-10-02T16:37:30.493310273Z","level":"INFO","msg":"writer: started","stream_id":"7ovz4jzt"}
+{"time":"2025-10-02T16:37:30.493324013Z","level":"INFO","msg":"sender: started","stream_id":"7ovz4jzt"}
+{"time":"2025-10-02T16:37:30.493358514Z","level":"INFO","msg":"handler: started","stream_id":"7ovz4jzt"}
diff --git a/glue_l1_regression/wandb/wandb/debug.log b/glue_l1_regression/wandb/wandb/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/files/output.log b/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/files/output.log
new file mode 100644
index 0000000000000000000000000000000000000000..99d85205b7a20611d3efeba3f676a9296073a5ee
--- /dev/null
+++ b/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/files/output.log
@@ -0,0 +1,64306 @@
+wandb: Detected [openai] in use.
+wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
+wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
+10/02 [16:37:31] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Glue', 8, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 8, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 8, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}}
+****** Skip RLDS main; path not found: None
+****** start build LeRobot main...
+build_tokenizer, cache_dir None tokenizer_dir None
+10/02 [16:37:42] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:130
+10/02 [16:37:43] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:435
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Glue
+****** length of the dataset: 10316
+****** Skip RLDS open-source-real-world; mixture 'a1_real_world' not found under: /vast/users/xiaodan/zhangjian/datasets/OXE
+****** Expect one of: []
+****** path: None
+****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None
+****** After build vla train dataset...
+****** iterable_sources: []
+****** Before build mixed iterable dataset...
+****** Build vla train dataloader successfully!
+************************* Build train_dataloader successful!
+************************* Before build_inf_evaluators
+10/02 [16:37:49] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+************************* Build evaluators successful!
+************************* Early exit flags: early_exit=False
+************************* Initialize model successful!
+***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt
+***** Load checkpoint successful!
+missing keys: ['action_head.model.layer_norm1.weight', 'action_head.model.layer_norm1.bias', 'action_head.model.fc1.weight', 'action_head.model.fc1.bias', 'action_head.model.mlp_resnet_blocks.0.ffn.0.weight', 'action_head.model.mlp_resnet_blocks.0.ffn.0.bias', 'action_head.model.mlp_resnet_blocks.0.ffn.1.weight', 'action_head.model.mlp_resnet_blocks.0.ffn.1.bias', 'action_head.model.mlp_resnet_blocks.1.ffn.0.weight', 'action_head.model.mlp_resnet_blocks.1.ffn.0.bias', 'action_head.model.mlp_resnet_blocks.1.ffn.1.weight', 'action_head.model.mlp_resnet_blocks.1.ffn.1.bias', 'action_head.model.layer_norm2.weight', 'action_head.model.layer_norm2.bias', 'action_head.model.fc2.weight', 'action_head.model.fc2.bias', 'proprio_projector.fc1.weight', 'proprio_projector.fc1.bias', 'proprio_projector.fc2.weight', 'proprio_projector.fc2.bias']
+unexpected keys: []
+************************* Initialize model successful!
+************************* LoRA flags: use_lora=True, lora_llm=False, lora_vit=False, lora_connector=False
+************************* Before add lora to model
+************************* Before FSDP model wrapping
+************************* FSDP model wrapping successful!
+************************* Before building optimizer and scheduler
+************* Before get lora params
+************* After get lora params successfully
+10/02 [16:39:03] INFO | >> Constructing optimizer with 2 param groups optim.py:1283
+**************************************************
+After building optimizer and scheduler and model, before training, peak GPU memory (MB): 35614
+************************* VLATrainer initialized successfully!
+************************* Before trainer.fit()
+Pre-train system metrics
+ System/Peak GPU Memory (MB)=35,614
+10/02 [16:39:04] WARNING | >> /vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py:200: UserWarning: To copy construct from a tensor, it is recommended to use warnings.py:109
+ sourceTensor.detach().clone() or sourceTensor.detach().clone().requires_grad_(True), rather than torch.tensor(sourceTensor).
+ timestep_list = [torch.tensor(ex["timestep"], dtype=torch.int64) for ex in batch]
+
+[step=1/500000]
+ train/ActionL1Loss=0.6606
+ throughput/total_tokens=192,000
+ System/Peak GPU Memory (MB)=40,144
+[step=2/500000]
+ train/ActionL1Loss=0.6682
+ throughput/total_tokens=384,000
+ throughput/device/tokens_per_second=1,214
+ throughput/device/batches_per_second=0.0506
+ System/Peak GPU Memory (MB)=46,917
+[step=3/500000]
+ train/ActionL1Loss=0.6331
+ throughput/total_tokens=576,000
+ throughput/device/tokens_per_second=1,196
+ throughput/device/batches_per_second=0.0499
+[step=4/500000]
+ train/ActionL1Loss=0.6222
+ throughput/total_tokens=768,000
+ throughput/device/tokens_per_second=1,190
+ throughput/device/batches_per_second=0.0496
+[step=5/500000]
+ train/ActionL1Loss=0.5762
+ throughput/total_tokens=960,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6/500000]
+ train/ActionL1Loss=0.5801
+ throughput/total_tokens=1,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7/500000]
+ train/ActionL1Loss=0.5002
+ throughput/total_tokens=1,344,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8/500000]
+ train/ActionL1Loss=0.5146
+ throughput/total_tokens=1,536,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9/500000]
+ train/ActionL1Loss=0.5447
+ throughput/total_tokens=1,728,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10/500000]
+ train/ActionL1Loss=0.4233
+ throughput/total_tokens=1,920,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11/500000]
+ train/ActionL1Loss=0.4707
+ throughput/total_tokens=2,112,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12/500000]
+ train/ActionL1Loss=0.4174
+ throughput/total_tokens=2,304,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=13/500000]
+ train/ActionL1Loss=0.5040
+ throughput/total_tokens=2,496,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=14/500000]
+ train/ActionL1Loss=0.4156
+ throughput/total_tokens=2,688,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=15/500000]
+ train/ActionL1Loss=0.3329
+ throughput/total_tokens=2,880,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=16/500000]
+ train/ActionL1Loss=0.4035
+ throughput/total_tokens=3,072,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=17/500000]
+ train/ActionL1Loss=0.4555
+ throughput/total_tokens=3,264,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=18/500000]
+ train/ActionL1Loss=0.5442
+ throughput/total_tokens=3,456,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=19/500000]
+ train/ActionL1Loss=0.3652
+ throughput/total_tokens=3,648,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=20/500000]
+ optim/total_grad_norm=20.53
+ train/ActionL1Loss=0.4465
+ throughput/total_tokens=3,840,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+ System/Peak GPU Memory (MB)=46,917
+[step=21/500000]
+ train/ActionL1Loss=0.4670
+ throughput/total_tokens=4,032,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=22/500000]
+ train/ActionL1Loss=0.3712
+ throughput/total_tokens=4,224,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=23/500000]
+ train/ActionL1Loss=0.4888
+ throughput/total_tokens=4,416,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=24/500000]
+ train/ActionL1Loss=0.4259
+ throughput/total_tokens=4,608,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=25/500000]
+ train/ActionL1Loss=0.4471
+ throughput/total_tokens=4,800,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=26/500000]
+ train/ActionL1Loss=0.4744
+ throughput/total_tokens=4,992,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=27/500000]
+ train/ActionL1Loss=0.4111
+ throughput/total_tokens=5,184,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=28/500000]
+ train/ActionL1Loss=0.4400
+ throughput/total_tokens=5,376,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=29/500000]
+ train/ActionL1Loss=0.4456
+ throughput/total_tokens=5,568,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=30/500000]
+ train/ActionL1Loss=0.4581
+ throughput/total_tokens=5,760,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+ System/Peak GPU Memory (MB)=46,917
+[step=31/500000]
+ train/ActionL1Loss=0.3012
+ throughput/total_tokens=5,952,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=32/500000]
+ train/ActionL1Loss=0.4191
+ throughput/total_tokens=6,144,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=33/500000]
+ train/ActionL1Loss=0.4199
+ throughput/total_tokens=6,336,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=34/500000]
+ train/ActionL1Loss=0.3712
+ throughput/total_tokens=6,528,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=35/500000]
+ train/ActionL1Loss=0.3663
+ throughput/total_tokens=6,720,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=36/500000]
+ train/ActionL1Loss=0.4052
+ throughput/total_tokens=6,912,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=37/500000]
+ train/ActionL1Loss=0.4858
+ throughput/total_tokens=7,104,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=38/500000]
+ train/ActionL1Loss=0.4051
+ throughput/total_tokens=7,296,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=39/500000]
+ train/ActionL1Loss=0.3161
+ throughput/total_tokens=7,488,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=40/500000]
+ optim/total_grad_norm=15.95
+ train/ActionL1Loss=0.4251
+ throughput/total_tokens=7,680,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+ System/Peak GPU Memory (MB)=46,917
+[step=41/500000]
+ train/ActionL1Loss=0.3571
+ throughput/total_tokens=7,872,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=42/500000]
+ train/ActionL1Loss=0.4353
+ throughput/total_tokens=8,064,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=43/500000]
+ train/ActionL1Loss=0.2859
+ throughput/total_tokens=8,256,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=44/500000]
+ train/ActionL1Loss=0.4893
+ throughput/total_tokens=8,448,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=45/500000]
+ train/ActionL1Loss=0.3635
+ throughput/total_tokens=8,640,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=46/500000]
+ train/ActionL1Loss=0.3984
+ throughput/total_tokens=8,832,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=47/500000]
+ train/ActionL1Loss=0.3151
+ throughput/total_tokens=9,024,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=48/500000]
+ train/ActionL1Loss=0.4416
+ throughput/total_tokens=9,216,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=49/500000]
+ train/ActionL1Loss=0.3956
+ throughput/total_tokens=9,408,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=50/500000]
+ train/ActionL1Loss=0.3891
+ throughput/total_tokens=9,600,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+ System/Peak GPU Memory (MB)=46,917
+[step=51/500000]
+ train/ActionL1Loss=0.2958
+ throughput/total_tokens=9,792,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=52/500000]
+ train/ActionL1Loss=0.4477
+ throughput/total_tokens=9,984,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=53/500000]
+ train/ActionL1Loss=0.5463
+ throughput/total_tokens=10,176,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=54/500000]
+ train/ActionL1Loss=0.4203
+ throughput/total_tokens=10,368,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=55/500000]
+ train/ActionL1Loss=0.4748
+ throughput/total_tokens=10,560,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=56/500000]
+ train/ActionL1Loss=0.5711
+ throughput/total_tokens=10,752,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=57/500000]
+ train/ActionL1Loss=0.4750
+ throughput/total_tokens=10,944,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=58/500000]
+ train/ActionL1Loss=0.3738
+ throughput/total_tokens=11,136,000
+ throughput/device/tokens_per_second=1,174
+ throughput/device/batches_per_second=0.0490
+[step=59/500000]
+ train/ActionL1Loss=0.3183
+ throughput/total_tokens=11,328,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=60/500000]
+ optim/total_grad_norm=20.99
+ train/ActionL1Loss=0.4038
+ throughput/total_tokens=11,520,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+ System/Peak GPU Memory (MB)=46,917
+[step=61/500000]
+ train/ActionL1Loss=0.4500
+ throughput/total_tokens=11,712,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=62/500000]
+ train/ActionL1Loss=0.3982
+ throughput/total_tokens=11,904,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=63/500000]
+ train/ActionL1Loss=0.3293
+ throughput/total_tokens=12,096,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=64/500000]
+ train/ActionL1Loss=0.4426
+ throughput/total_tokens=12,288,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=65/500000]
+ train/ActionL1Loss=0.4282
+ throughput/total_tokens=12,480,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=66/500000]
+ train/ActionL1Loss=0.3485
+ throughput/total_tokens=12,672,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=67/500000]
+ train/ActionL1Loss=0.4177
+ throughput/total_tokens=12,864,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=68/500000]
+ train/ActionL1Loss=0.3172
+ throughput/total_tokens=13,056,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=69/500000]
+ train/ActionL1Loss=0.4425
+ throughput/total_tokens=13,248,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=70/500000]
+ train/ActionL1Loss=0.4702
+ throughput/total_tokens=13,440,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+ System/Peak GPU Memory (MB)=46,917
+[step=71/500000]
+ train/ActionL1Loss=0.3319
+ throughput/total_tokens=13,632,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=72/500000]
+ train/ActionL1Loss=0.3323
+ throughput/total_tokens=13,824,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=73/500000]
+ train/ActionL1Loss=0.4778
+ throughput/total_tokens=14,016,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=74/500000]
+ train/ActionL1Loss=0.4804
+ throughput/total_tokens=14,208,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=75/500000]
+ train/ActionL1Loss=0.2698
+ throughput/total_tokens=14,400,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=76/500000]
+ train/ActionL1Loss=0.4458
+ throughput/total_tokens=14,592,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=77/500000]
+ train/ActionL1Loss=0.4586
+ throughput/total_tokens=14,784,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=78/500000]
+ train/ActionL1Loss=0.2402
+ throughput/total_tokens=14,976,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=79/500000]
+ train/ActionL1Loss=0.3508
+ throughput/total_tokens=15,168,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=80/500000]
+ optim/total_grad_norm=22.00
+ train/ActionL1Loss=0.3772
+ throughput/total_tokens=15,360,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+ System/Peak GPU Memory (MB)=46,917
+[step=81/500000]
+ train/ActionL1Loss=0.2776
+ throughput/total_tokens=15,552,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=82/500000]
+ train/ActionL1Loss=0.3576
+ throughput/total_tokens=15,744,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=83/500000]
+ train/ActionL1Loss=0.3556
+ throughput/total_tokens=15,936,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=84/500000]
+ train/ActionL1Loss=0.2589
+ throughput/total_tokens=16,128,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=85/500000]
+ train/ActionL1Loss=0.3161
+ throughput/total_tokens=16,320,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=86/500000]
+ train/ActionL1Loss=0.2971
+ throughput/total_tokens=16,512,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=87/500000]
+ train/ActionL1Loss=0.2837
+ throughput/total_tokens=16,704,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=88/500000]
+ train/ActionL1Loss=0.2450
+ throughput/total_tokens=16,896,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=89/500000]
+ train/ActionL1Loss=0.2160
+ throughput/total_tokens=17,088,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=90/500000]
+ train/ActionL1Loss=0.2609
+ throughput/total_tokens=17,280,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+ System/Peak GPU Memory (MB)=46,917
+[step=91/500000]
+ train/ActionL1Loss=0.2988
+ throughput/total_tokens=17,472,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=92/500000]
+ train/ActionL1Loss=0.2838
+ throughput/total_tokens=17,664,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=93/500000]
+ train/ActionL1Loss=0.3007
+ throughput/total_tokens=17,856,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=94/500000]
+ train/ActionL1Loss=0.2933
+ throughput/total_tokens=18,048,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=95/500000]
+ train/ActionL1Loss=0.2765
+ throughput/total_tokens=18,240,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=96/500000]
+ train/ActionL1Loss=0.2539
+ throughput/total_tokens=18,432,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=97/500000]
+ train/ActionL1Loss=0.2644
+ throughput/total_tokens=18,624,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=98/500000]
+ train/ActionL1Loss=0.2753
+ throughput/total_tokens=18,816,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=99/500000]
+ train/ActionL1Loss=0.2411
+ throughput/total_tokens=19,008,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=100/500000]
+ optim/total_grad_norm=19.69
+ train/ActionL1Loss=0.2207
+ throughput/total_tokens=19,200,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+ System/Peak GPU Memory (MB)=46,917
+[step=101/500000]
+ train/ActionL1Loss=0.2253
+ throughput/total_tokens=19,392,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=102/500000]
+ train/ActionL1Loss=0.2572
+ throughput/total_tokens=19,584,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=103/500000]
+ train/ActionL1Loss=0.2184
+ throughput/total_tokens=19,776,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=104/500000]
+ train/ActionL1Loss=0.2631
+ throughput/total_tokens=19,968,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=105/500000]
+ train/ActionL1Loss=0.2687
+ throughput/total_tokens=20,160,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=106/500000]
+ train/ActionL1Loss=0.2880
+ throughput/total_tokens=20,352,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=107/500000]
+ train/ActionL1Loss=0.2337
+ throughput/total_tokens=20,544,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=108/500000]
+ train/ActionL1Loss=0.2202
+ throughput/total_tokens=20,736,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=109/500000]
+ train/ActionL1Loss=0.2220
+ throughput/total_tokens=20,928,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=110/500000]
+ train/ActionL1Loss=0.2418
+ throughput/total_tokens=21,120,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+ System/Peak GPU Memory (MB)=46,917
+[step=111/500000]
+ train/ActionL1Loss=0.2354
+ throughput/total_tokens=21,312,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=112/500000]
+ train/ActionL1Loss=0.2462
+ throughput/total_tokens=21,504,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=113/500000]
+ train/ActionL1Loss=0.2348
+ throughput/total_tokens=21,696,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=114/500000]
+ train/ActionL1Loss=0.2299
+ throughput/total_tokens=21,888,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=115/500000]
+ train/ActionL1Loss=0.2522
+ throughput/total_tokens=22,080,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=116/500000]
+ train/ActionL1Loss=0.2313
+ throughput/total_tokens=22,272,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=117/500000]
+ train/ActionL1Loss=0.2435
+ throughput/total_tokens=22,464,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=118/500000]
+ train/ActionL1Loss=0.2556
+ throughput/total_tokens=22,656,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=119/500000]
+ train/ActionL1Loss=0.2429
+ throughput/total_tokens=22,848,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=120/500000]
+ optim/total_grad_norm=23.64
+ train/ActionL1Loss=0.2896
+ throughput/total_tokens=23,040,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=121/500000]
+ train/ActionL1Loss=0.2347
+ throughput/total_tokens=23,232,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=122/500000]
+ train/ActionL1Loss=0.2611
+ throughput/total_tokens=23,424,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=123/500000]
+ train/ActionL1Loss=0.2104
+ throughput/total_tokens=23,616,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=124/500000]
+ train/ActionL1Loss=0.2489
+ throughput/total_tokens=23,808,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=125/500000]
+ train/ActionL1Loss=0.2176
+ throughput/total_tokens=24,000,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=126/500000]
+ train/ActionL1Loss=0.2223
+ throughput/total_tokens=24,192,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=127/500000]
+ train/ActionL1Loss=0.2629
+ throughput/total_tokens=24,384,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=128/500000]
+ train/ActionL1Loss=0.2531
+ throughput/total_tokens=24,576,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=129/500000]
+ train/ActionL1Loss=0.2517
+ throughput/total_tokens=24,768,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=130/500000]
+ train/ActionL1Loss=0.2499
+ throughput/total_tokens=24,960,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=131/500000]
+ train/ActionL1Loss=0.2575
+ throughput/total_tokens=25,152,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=132/500000]
+ train/ActionL1Loss=0.2220
+ throughput/total_tokens=25,344,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=133/500000]
+ train/ActionL1Loss=0.2378
+ throughput/total_tokens=25,536,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=134/500000]
+ train/ActionL1Loss=0.2407
+ throughput/total_tokens=25,728,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=135/500000]
+ train/ActionL1Loss=0.2236
+ throughput/total_tokens=25,920,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=136/500000]
+ train/ActionL1Loss=0.2387
+ throughput/total_tokens=26,112,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=137/500000]
+ train/ActionL1Loss=0.2387
+ throughput/total_tokens=26,304,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=138/500000]
+ train/ActionL1Loss=0.2049
+ throughput/total_tokens=26,496,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=139/500000]
+ train/ActionL1Loss=0.2269
+ throughput/total_tokens=26,688,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=140/500000]
+ optim/total_grad_norm=19.99
+ train/ActionL1Loss=0.2372
+ throughput/total_tokens=26,880,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+ System/Peak GPU Memory (MB)=46,917
+[step=141/500000]
+ train/ActionL1Loss=0.2112
+ throughput/total_tokens=27,072,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=142/500000]
+ train/ActionL1Loss=0.2280
+ throughput/total_tokens=27,264,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=143/500000]
+ train/ActionL1Loss=0.2583
+ throughput/total_tokens=27,456,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=144/500000]
+ train/ActionL1Loss=0.2451
+ throughput/total_tokens=27,648,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=145/500000]
+ train/ActionL1Loss=0.2328
+ throughput/total_tokens=27,840,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=146/500000]
+ train/ActionL1Loss=0.2172
+ throughput/total_tokens=28,032,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=147/500000]
+ train/ActionL1Loss=0.2484
+ throughput/total_tokens=28,224,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=148/500000]
+ train/ActionL1Loss=0.2113
+ throughput/total_tokens=28,416,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=149/500000]
+ train/ActionL1Loss=0.2387
+ throughput/total_tokens=28,608,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=150/500000]
+ train/ActionL1Loss=0.2573
+ throughput/total_tokens=28,800,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+ System/Peak GPU Memory (MB)=46,917
+[step=151/500000]
+ train/ActionL1Loss=0.2581
+ throughput/total_tokens=28,992,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=152/500000]
+ train/ActionL1Loss=0.2783
+ throughput/total_tokens=29,184,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=153/500000]
+ train/ActionL1Loss=0.2441
+ throughput/total_tokens=29,376,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=154/500000]
+ train/ActionL1Loss=0.2540
+ throughput/total_tokens=29,568,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=155/500000]
+ train/ActionL1Loss=0.2251
+ throughput/total_tokens=29,760,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=156/500000]
+ train/ActionL1Loss=0.2275
+ throughput/total_tokens=29,952,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=157/500000]
+ train/ActionL1Loss=0.2321
+ throughput/total_tokens=30,144,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=158/500000]
+ train/ActionL1Loss=0.2422
+ throughput/total_tokens=30,336,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=159/500000]
+ train/ActionL1Loss=0.2381
+ throughput/total_tokens=30,528,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=160/500000]
+ optim/total_grad_norm=31.55
+ train/ActionL1Loss=0.2459
+ throughput/total_tokens=30,720,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+ System/Peak GPU Memory (MB)=46,917
+[step=161/500000]
+ train/ActionL1Loss=0.2383
+ throughput/total_tokens=30,912,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=162/500000]
+ train/ActionL1Loss=0.2023
+ throughput/total_tokens=31,104,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=163/500000]
+ train/ActionL1Loss=0.2611
+ throughput/total_tokens=31,296,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=164/500000]
+ train/ActionL1Loss=0.2540
+ throughput/total_tokens=31,488,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=165/500000]
+ train/ActionL1Loss=0.2282
+ throughput/total_tokens=31,680,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=166/500000]
+ train/ActionL1Loss=0.2281
+ throughput/total_tokens=31,872,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=167/500000]
+ train/ActionL1Loss=0.2216
+ throughput/total_tokens=32,064,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=168/500000]
+ train/ActionL1Loss=0.2254
+ throughput/total_tokens=32,256,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=169/500000]
+ train/ActionL1Loss=0.2558
+ throughput/total_tokens=32,448,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=170/500000]
+ train/ActionL1Loss=0.2150
+ throughput/total_tokens=32,640,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=171/500000]
+ train/ActionL1Loss=0.2343
+ throughput/total_tokens=32,832,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=172/500000]
+ train/ActionL1Loss=0.2433
+ throughput/total_tokens=33,024,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=173/500000]
+ train/ActionL1Loss=0.2602
+ throughput/total_tokens=33,216,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=174/500000]
+ train/ActionL1Loss=0.1961
+ throughput/total_tokens=33,408,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=175/500000]
+ train/ActionL1Loss=0.2087
+ throughput/total_tokens=33,600,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=176/500000]
+ train/ActionL1Loss=0.2371
+ throughput/total_tokens=33,792,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=177/500000]
+ train/ActionL1Loss=0.2352
+ throughput/total_tokens=33,984,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=178/500000]
+ train/ActionL1Loss=0.2306
+ throughput/total_tokens=34,176,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=179/500000]
+ train/ActionL1Loss=0.2397
+ throughput/total_tokens=34,368,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=180/500000]
+ optim/total_grad_norm=21.88
+ train/ActionL1Loss=0.2087
+ throughput/total_tokens=34,560,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=181/500000]
+ train/ActionL1Loss=0.2135
+ throughput/total_tokens=34,752,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=182/500000]
+ train/ActionL1Loss=0.2072
+ throughput/total_tokens=34,944,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=183/500000]
+ train/ActionL1Loss=0.2637
+ throughput/total_tokens=35,136,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=184/500000]
+ train/ActionL1Loss=0.2438
+ throughput/total_tokens=35,328,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=185/500000]
+ train/ActionL1Loss=0.2099
+ throughput/total_tokens=35,520,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=186/500000]
+ train/ActionL1Loss=0.2379
+ throughput/total_tokens=35,712,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=187/500000]
+ train/ActionL1Loss=0.2354
+ throughput/total_tokens=35,904,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=188/500000]
+ train/ActionL1Loss=0.2171
+ throughput/total_tokens=36,096,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=189/500000]
+ train/ActionL1Loss=0.2134
+ throughput/total_tokens=36,288,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=190/500000]
+ train/ActionL1Loss=0.2152
+ throughput/total_tokens=36,480,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=191/500000]
+ train/ActionL1Loss=0.2089
+ throughput/total_tokens=36,672,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=192/500000]
+ train/ActionL1Loss=0.2501
+ throughput/total_tokens=36,864,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=193/500000]
+ train/ActionL1Loss=0.2126
+ throughput/total_tokens=37,056,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=194/500000]
+ train/ActionL1Loss=0.2037
+ throughput/total_tokens=37,248,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=195/500000]
+ train/ActionL1Loss=0.1908
+ throughput/total_tokens=37,440,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=196/500000]
+ train/ActionL1Loss=0.1830
+ throughput/total_tokens=37,632,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=197/500000]
+ train/ActionL1Loss=0.2259
+ throughput/total_tokens=37,824,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=198/500000]
+ train/ActionL1Loss=0.2148
+ throughput/total_tokens=38,016,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=199/500000]
+ train/ActionL1Loss=0.1827
+ throughput/total_tokens=38,208,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=200/500000]
+ optim/total_grad_norm=21.80
+ train/ActionL1Loss=0.2116
+ throughput/total_tokens=38,400,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=201/500000]
+ train/ActionL1Loss=0.2362
+ throughput/total_tokens=38,592,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=202/500000]
+ train/ActionL1Loss=0.2205
+ throughput/total_tokens=38,784,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=203/500000]
+ train/ActionL1Loss=0.2281
+ throughput/total_tokens=38,976,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=204/500000]
+ train/ActionL1Loss=0.1844
+ throughput/total_tokens=39,168,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=205/500000]
+ train/ActionL1Loss=0.2034
+ throughput/total_tokens=39,360,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=206/500000]
+ train/ActionL1Loss=0.1963
+ throughput/total_tokens=39,552,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=207/500000]
+ train/ActionL1Loss=0.2027
+ throughput/total_tokens=39,744,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=208/500000]
+ train/ActionL1Loss=0.2071
+ throughput/total_tokens=39,936,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=209/500000]
+ train/ActionL1Loss=0.1933
+ throughput/total_tokens=40,128,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=210/500000]
+ train/ActionL1Loss=0.2118
+ throughput/total_tokens=40,320,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+ System/Peak GPU Memory (MB)=46,917
+[step=211/500000]
+ train/ActionL1Loss=0.2147
+ throughput/total_tokens=40,512,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=212/500000]
+ train/ActionL1Loss=0.2124
+ throughput/total_tokens=40,704,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=213/500000]
+ train/ActionL1Loss=0.2208
+ throughput/total_tokens=40,896,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=214/500000]
+ train/ActionL1Loss=0.2042
+ throughput/total_tokens=41,088,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=215/500000]
+ train/ActionL1Loss=0.1777
+ throughput/total_tokens=41,280,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=216/500000]
+ train/ActionL1Loss=0.2007
+ throughput/total_tokens=41,472,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=217/500000]
+ train/ActionL1Loss=0.1943
+ throughput/total_tokens=41,664,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=218/500000]
+ train/ActionL1Loss=0.2148
+ throughput/total_tokens=41,856,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=219/500000]
+ train/ActionL1Loss=0.1785
+ throughput/total_tokens=42,048,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=220/500000]
+ optim/total_grad_norm=31.32
+ train/ActionL1Loss=0.2416
+ throughput/total_tokens=42,240,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=221/500000]
+ train/ActionL1Loss=0.2267
+ throughput/total_tokens=42,432,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=222/500000]
+ train/ActionL1Loss=0.2174
+ throughput/total_tokens=42,624,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=223/500000]
+ train/ActionL1Loss=0.2110
+ throughput/total_tokens=42,816,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=224/500000]
+ train/ActionL1Loss=0.1909
+ throughput/total_tokens=43,008,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=225/500000]
+ train/ActionL1Loss=0.1830
+ throughput/total_tokens=43,200,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=226/500000]
+ train/ActionL1Loss=0.2041
+ throughput/total_tokens=43,392,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=227/500000]
+ train/ActionL1Loss=0.1996
+ throughput/total_tokens=43,584,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=228/500000]
+ train/ActionL1Loss=0.1767
+ throughput/total_tokens=43,776,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=229/500000]
+ train/ActionL1Loss=0.1600
+ throughput/total_tokens=43,968,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=230/500000]
+ train/ActionL1Loss=0.2081
+ throughput/total_tokens=44,160,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=231/500000]
+ train/ActionL1Loss=0.1945
+ throughput/total_tokens=44,352,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=232/500000]
+ train/ActionL1Loss=0.1766
+ throughput/total_tokens=44,544,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=233/500000]
+ train/ActionL1Loss=0.1533
+ throughput/total_tokens=44,736,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=234/500000]
+ train/ActionL1Loss=0.1825
+ throughput/total_tokens=44,928,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=235/500000]
+ train/ActionL1Loss=0.1731
+ throughput/total_tokens=45,120,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=236/500000]
+ train/ActionL1Loss=0.1810
+ throughput/total_tokens=45,312,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=237/500000]
+ train/ActionL1Loss=0.1868
+ throughput/total_tokens=45,504,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=238/500000]
+ train/ActionL1Loss=0.1946
+ throughput/total_tokens=45,696,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=239/500000]
+ train/ActionL1Loss=0.1713
+ throughput/total_tokens=45,888,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=240/500000]
+ optim/total_grad_norm=23.22
+ train/ActionL1Loss=0.1905
+ throughput/total_tokens=46,080,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=241/500000]
+ train/ActionL1Loss=0.1897
+ throughput/total_tokens=46,272,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=242/500000]
+ train/ActionL1Loss=0.1869
+ throughput/total_tokens=46,464,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=243/500000]
+ train/ActionL1Loss=0.1769
+ throughput/total_tokens=46,656,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=244/500000]
+ train/ActionL1Loss=0.1996
+ throughput/total_tokens=46,848,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=245/500000]
+ train/ActionL1Loss=0.1921
+ throughput/total_tokens=47,040,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=246/500000]
+ train/ActionL1Loss=0.1971
+ throughput/total_tokens=47,232,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=247/500000]
+ train/ActionL1Loss=0.1718
+ throughput/total_tokens=47,424,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=248/500000]
+ train/ActionL1Loss=0.1910
+ throughput/total_tokens=47,616,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=249/500000]
+ train/ActionL1Loss=0.1973
+ throughput/total_tokens=47,808,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=250/500000]
+ train/ActionL1Loss=0.1913
+ throughput/total_tokens=48,000,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=251/500000]
+ train/ActionL1Loss=0.1871
+ throughput/total_tokens=48,192,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=252/500000]
+ train/ActionL1Loss=0.1795
+ throughput/total_tokens=48,384,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=253/500000]
+ train/ActionL1Loss=0.1760
+ throughput/total_tokens=48,576,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=254/500000]
+ train/ActionL1Loss=0.1745
+ throughput/total_tokens=48,768,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=255/500000]
+ train/ActionL1Loss=0.1720
+ throughput/total_tokens=48,960,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=256/500000]
+ train/ActionL1Loss=0.1465
+ throughput/total_tokens=49,152,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=257/500000]
+ train/ActionL1Loss=0.1491
+ throughput/total_tokens=49,344,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=258/500000]
+ train/ActionL1Loss=0.1661
+ throughput/total_tokens=49,536,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=259/500000]
+ train/ActionL1Loss=0.1405
+ throughput/total_tokens=49,728,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=260/500000]
+ optim/total_grad_norm=20.52
+ train/ActionL1Loss=0.1843
+ throughput/total_tokens=49,920,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+ System/Peak GPU Memory (MB)=46,917
+[step=261/500000]
+ train/ActionL1Loss=0.1773
+ throughput/total_tokens=50,112,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=262/500000]
+ train/ActionL1Loss=0.1550
+ throughput/total_tokens=50,304,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=263/500000]
+ train/ActionL1Loss=0.1512
+ throughput/total_tokens=50,496,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=264/500000]
+ train/ActionL1Loss=0.1791
+ throughput/total_tokens=50,688,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=265/500000]
+ train/ActionL1Loss=0.1537
+ throughput/total_tokens=50,880,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=266/500000]
+ train/ActionL1Loss=0.2147
+ throughput/total_tokens=51,072,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=267/500000]
+ train/ActionL1Loss=0.1582
+ throughput/total_tokens=51,264,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=268/500000]
+ train/ActionL1Loss=0.1627
+ throughput/total_tokens=51,456,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=269/500000]
+ train/ActionL1Loss=0.1838
+ throughput/total_tokens=51,648,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=270/500000]
+ train/ActionL1Loss=0.1810
+ throughput/total_tokens=51,840,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=271/500000]
+ train/ActionL1Loss=0.1844
+ throughput/total_tokens=52,032,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=272/500000]
+ train/ActionL1Loss=0.1731
+ throughput/total_tokens=52,224,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=273/500000]
+ train/ActionL1Loss=0.1759
+ throughput/total_tokens=52,416,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=274/500000]
+ train/ActionL1Loss=0.1926
+ throughput/total_tokens=52,608,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=275/500000]
+ train/ActionL1Loss=0.1920
+ throughput/total_tokens=52,800,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=276/500000]
+ train/ActionL1Loss=0.1523
+ throughput/total_tokens=52,992,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=277/500000]
+ train/ActionL1Loss=0.1771
+ throughput/total_tokens=53,184,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=278/500000]
+ train/ActionL1Loss=0.1562
+ throughput/total_tokens=53,376,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=279/500000]
+ train/ActionL1Loss=0.1646
+ throughput/total_tokens=53,568,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=280/500000]
+ optim/total_grad_norm=23.47
+ train/ActionL1Loss=0.1687
+ throughput/total_tokens=53,760,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=281/500000]
+ train/ActionL1Loss=0.1640
+ throughput/total_tokens=53,952,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=282/500000]
+ train/ActionL1Loss=0.1904
+ throughput/total_tokens=54,144,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=283/500000]
+ train/ActionL1Loss=0.1673
+ throughput/total_tokens=54,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=284/500000]
+ train/ActionL1Loss=0.1981
+ throughput/total_tokens=54,528,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=285/500000]
+ train/ActionL1Loss=0.1993
+ throughput/total_tokens=54,720,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=286/500000]
+ train/ActionL1Loss=0.1647
+ throughput/total_tokens=54,912,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=287/500000]
+ train/ActionL1Loss=0.1820
+ throughput/total_tokens=55,104,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=288/500000]
+ train/ActionL1Loss=0.1752
+ throughput/total_tokens=55,296,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=289/500000]
+ train/ActionL1Loss=0.1903
+ throughput/total_tokens=55,488,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=290/500000]
+ train/ActionL1Loss=0.2063
+ throughput/total_tokens=55,680,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=291/500000]
+ train/ActionL1Loss=0.1892
+ throughput/total_tokens=55,872,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=292/500000]
+ train/ActionL1Loss=0.1590
+ throughput/total_tokens=56,064,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=293/500000]
+ train/ActionL1Loss=0.1595
+ throughput/total_tokens=56,256,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=294/500000]
+ train/ActionL1Loss=0.1527
+ throughput/total_tokens=56,448,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=295/500000]
+ train/ActionL1Loss=0.1673
+ throughput/total_tokens=56,640,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=296/500000]
+ train/ActionL1Loss=0.1617
+ throughput/total_tokens=56,832,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=297/500000]
+ train/ActionL1Loss=0.1545
+ throughput/total_tokens=57,024,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=298/500000]
+ train/ActionL1Loss=0.1791
+ throughput/total_tokens=57,216,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=299/500000]
+ train/ActionL1Loss=0.2119
+ throughput/total_tokens=57,408,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=300/500000]
+ optim/total_grad_norm=20.43
+ train/ActionL1Loss=0.1520
+ throughput/total_tokens=57,600,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=301/500000]
+ train/ActionL1Loss=0.1722
+ throughput/total_tokens=57,792,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=302/500000]
+ train/ActionL1Loss=0.1706
+ throughput/total_tokens=57,984,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=303/500000]
+ train/ActionL1Loss=0.1600
+ throughput/total_tokens=58,176,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=304/500000]
+ train/ActionL1Loss=0.1792
+ throughput/total_tokens=58,368,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=305/500000]
+ train/ActionL1Loss=0.2148
+ throughput/total_tokens=58,560,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=306/500000]
+ train/ActionL1Loss=0.1504
+ throughput/total_tokens=58,752,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=307/500000]
+ train/ActionL1Loss=0.1527
+ throughput/total_tokens=58,944,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=308/500000]
+ train/ActionL1Loss=0.1664
+ throughput/total_tokens=59,136,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=309/500000]
+ train/ActionL1Loss=0.1738
+ throughput/total_tokens=59,328,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=310/500000]
+ train/ActionL1Loss=0.1689
+ throughput/total_tokens=59,520,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+ System/Peak GPU Memory (MB)=46,917
+[step=311/500000]
+ train/ActionL1Loss=0.1578
+ throughput/total_tokens=59,712,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=312/500000]
+ train/ActionL1Loss=0.1811
+ throughput/total_tokens=59,904,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=313/500000]
+ train/ActionL1Loss=0.1927
+ throughput/total_tokens=60,096,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=314/500000]
+ train/ActionL1Loss=0.1825
+ throughput/total_tokens=60,288,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=315/500000]
+ train/ActionL1Loss=0.1454
+ throughput/total_tokens=60,480,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=316/500000]
+ train/ActionL1Loss=0.1820
+ throughput/total_tokens=60,672,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=317/500000]
+ train/ActionL1Loss=0.1471
+ throughput/total_tokens=60,864,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=318/500000]
+ train/ActionL1Loss=0.1585
+ throughput/total_tokens=61,056,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=319/500000]
+ train/ActionL1Loss=0.1545
+ throughput/total_tokens=61,248,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=320/500000]
+ optim/total_grad_norm=21.65
+ train/ActionL1Loss=0.1570
+ throughput/total_tokens=61,440,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=321/500000]
+ train/ActionL1Loss=0.1482
+ throughput/total_tokens=61,632,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=322/500000]
+ train/ActionL1Loss=0.1323
+ throughput/total_tokens=61,824,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=323/500000]
+ train/ActionL1Loss=0.1584
+ throughput/total_tokens=62,016,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=324/500000]
+ train/ActionL1Loss=0.1555
+ throughput/total_tokens=62,208,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=325/500000]
+ train/ActionL1Loss=0.1721
+ throughput/total_tokens=62,400,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=326/500000]
+ train/ActionL1Loss=0.1553
+ throughput/total_tokens=62,592,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=327/500000]
+ train/ActionL1Loss=0.1688
+ throughput/total_tokens=62,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=328/500000]
+ train/ActionL1Loss=0.1652
+ throughput/total_tokens=62,976,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=329/500000]
+ train/ActionL1Loss=0.1628
+ throughput/total_tokens=63,168,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=330/500000]
+ train/ActionL1Loss=0.1731
+ throughput/total_tokens=63,360,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=331/500000]
+ train/ActionL1Loss=0.1460
+ throughput/total_tokens=63,552,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=332/500000]
+ train/ActionL1Loss=0.1435
+ throughput/total_tokens=63,744,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=333/500000]
+ train/ActionL1Loss=0.1517
+ throughput/total_tokens=63,936,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=334/500000]
+ train/ActionL1Loss=0.1779
+ throughput/total_tokens=64,128,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=335/500000]
+ train/ActionL1Loss=0.1486
+ throughput/total_tokens=64,320,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=336/500000]
+ train/ActionL1Loss=0.1639
+ throughput/total_tokens=64,512,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=337/500000]
+ train/ActionL1Loss=0.1400
+ throughput/total_tokens=64,704,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=338/500000]
+ train/ActionL1Loss=0.1540
+ throughput/total_tokens=64,896,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=339/500000]
+ train/ActionL1Loss=0.1562
+ throughput/total_tokens=65,088,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=340/500000]
+ optim/total_grad_norm=23.16
+ train/ActionL1Loss=0.1565
+ throughput/total_tokens=65,280,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=341/500000]
+ train/ActionL1Loss=0.1522
+ throughput/total_tokens=65,472,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=342/500000]
+ train/ActionL1Loss=0.1255
+ throughput/total_tokens=65,664,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=343/500000]
+ train/ActionL1Loss=0.1406
+ throughput/total_tokens=65,856,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=344/500000]
+ train/ActionL1Loss=0.1701
+ throughput/total_tokens=66,048,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=345/500000]
+ train/ActionL1Loss=0.1711
+ throughput/total_tokens=66,240,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=346/500000]
+ train/ActionL1Loss=0.1359
+ throughput/total_tokens=66,432,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=347/500000]
+ train/ActionL1Loss=0.1313
+ throughput/total_tokens=66,624,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=348/500000]
+ train/ActionL1Loss=0.1486
+ throughput/total_tokens=66,816,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=349/500000]
+ train/ActionL1Loss=0.1419
+ throughput/total_tokens=67,008,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=350/500000]
+ train/ActionL1Loss=0.1361
+ throughput/total_tokens=67,200,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=351/500000]
+ train/ActionL1Loss=0.1494
+ throughput/total_tokens=67,392,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=352/500000]
+ train/ActionL1Loss=0.1498
+ throughput/total_tokens=67,584,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=353/500000]
+ train/ActionL1Loss=0.1561
+ throughput/total_tokens=67,776,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=354/500000]
+ train/ActionL1Loss=0.1289
+ throughput/total_tokens=67,968,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=355/500000]
+ train/ActionL1Loss=0.1285
+ throughput/total_tokens=68,160,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=356/500000]
+ train/ActionL1Loss=0.1503
+ throughput/total_tokens=68,352,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=357/500000]
+ train/ActionL1Loss=0.1098
+ throughput/total_tokens=68,544,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=358/500000]
+ train/ActionL1Loss=0.1387
+ throughput/total_tokens=68,736,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=359/500000]
+ train/ActionL1Loss=0.1452
+ throughput/total_tokens=68,928,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=360/500000]
+ optim/total_grad_norm=20.25
+ train/ActionL1Loss=0.1295
+ throughput/total_tokens=69,120,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+ System/Peak GPU Memory (MB)=46,917
+[step=361/500000]
+ train/ActionL1Loss=0.1376
+ throughput/total_tokens=69,312,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=362/500000]
+ train/ActionL1Loss=0.1419
+ throughput/total_tokens=69,504,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=363/500000]
+ train/ActionL1Loss=0.1379
+ throughput/total_tokens=69,696,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=364/500000]
+ train/ActionL1Loss=0.1555
+ throughput/total_tokens=69,888,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=365/500000]
+ train/ActionL1Loss=0.1624
+ throughput/total_tokens=70,080,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=366/500000]
+ train/ActionL1Loss=0.1415
+ throughput/total_tokens=70,272,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=367/500000]
+ train/ActionL1Loss=0.1397
+ throughput/total_tokens=70,464,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=368/500000]
+ train/ActionL1Loss=0.1745
+ throughput/total_tokens=70,656,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=369/500000]
+ train/ActionL1Loss=0.1583
+ throughput/total_tokens=70,848,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=370/500000]
+ train/ActionL1Loss=0.1538
+ throughput/total_tokens=71,040,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=371/500000]
+ train/ActionL1Loss=0.1381
+ throughput/total_tokens=71,232,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=372/500000]
+ train/ActionL1Loss=0.1587
+ throughput/total_tokens=71,424,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=373/500000]
+ train/ActionL1Loss=0.1450
+ throughput/total_tokens=71,616,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=374/500000]
+ train/ActionL1Loss=0.1517
+ throughput/total_tokens=71,808,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=375/500000]
+ train/ActionL1Loss=0.1376
+ throughput/total_tokens=72,000,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=376/500000]
+ train/ActionL1Loss=0.1347
+ throughput/total_tokens=72,192,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=377/500000]
+ train/ActionL1Loss=0.1273
+ throughput/total_tokens=72,384,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=378/500000]
+ train/ActionL1Loss=0.1453
+ throughput/total_tokens=72,576,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=379/500000]
+ train/ActionL1Loss=0.1553
+ throughput/total_tokens=72,768,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=380/500000]
+ optim/total_grad_norm=16.06
+ train/ActionL1Loss=0.1248
+ throughput/total_tokens=72,960,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=381/500000]
+ train/ActionL1Loss=0.1263
+ throughput/total_tokens=73,152,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=382/500000]
+ train/ActionL1Loss=0.1357
+ throughput/total_tokens=73,344,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=383/500000]
+ train/ActionL1Loss=0.1243
+ throughput/total_tokens=73,536,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=384/500000]
+ train/ActionL1Loss=0.1273
+ throughput/total_tokens=73,728,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=385/500000]
+ train/ActionL1Loss=0.1412
+ throughput/total_tokens=73,920,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=386/500000]
+ train/ActionL1Loss=0.1377
+ throughput/total_tokens=74,112,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=387/500000]
+ train/ActionL1Loss=0.1622
+ throughput/total_tokens=74,304,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=388/500000]
+ train/ActionL1Loss=0.1477
+ throughput/total_tokens=74,496,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=389/500000]
+ train/ActionL1Loss=0.1382
+ throughput/total_tokens=74,688,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=390/500000]
+ train/ActionL1Loss=0.1539
+ throughput/total_tokens=74,880,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=391/500000]
+ train/ActionL1Loss=0.1578
+ throughput/total_tokens=75,072,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=392/500000]
+ train/ActionL1Loss=0.1497
+ throughput/total_tokens=75,264,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=393/500000]
+ train/ActionL1Loss=0.1500
+ throughput/total_tokens=75,456,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=394/500000]
+ train/ActionL1Loss=0.1576
+ throughput/total_tokens=75,648,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=395/500000]
+ train/ActionL1Loss=0.1368
+ throughput/total_tokens=75,840,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=396/500000]
+ train/ActionL1Loss=0.1192
+ throughput/total_tokens=76,032,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=397/500000]
+ train/ActionL1Loss=0.1240
+ throughput/total_tokens=76,224,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=398/500000]
+ train/ActionL1Loss=0.1646
+ throughput/total_tokens=76,416,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=399/500000]
+ train/ActionL1Loss=0.1382
+ throughput/total_tokens=76,608,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=400/500000]
+ optim/total_grad_norm=18.10
+ train/ActionL1Loss=0.1686
+ throughput/total_tokens=76,800,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=401/500000]
+ train/ActionL1Loss=0.1357
+ throughput/total_tokens=76,992,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=402/500000]
+ train/ActionL1Loss=0.1280
+ throughput/total_tokens=77,184,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=403/500000]
+ train/ActionL1Loss=0.1234
+ throughput/total_tokens=77,376,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=404/500000]
+ train/ActionL1Loss=0.1386
+ throughput/total_tokens=77,568,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=405/500000]
+ train/ActionL1Loss=0.1393
+ throughput/total_tokens=77,760,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=406/500000]
+ train/ActionL1Loss=0.1230
+ throughput/total_tokens=77,952,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=407/500000]
+ train/ActionL1Loss=0.1340
+ throughput/total_tokens=78,144,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=408/500000]
+ train/ActionL1Loss=0.1342
+ throughput/total_tokens=78,336,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=409/500000]
+ train/ActionL1Loss=0.1527
+ throughput/total_tokens=78,528,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=410/500000]
+ train/ActionL1Loss=0.1354
+ throughput/total_tokens=78,720,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=411/500000]
+ train/ActionL1Loss=0.1215
+ throughput/total_tokens=78,912,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=412/500000]
+ train/ActionL1Loss=0.1297
+ throughput/total_tokens=79,104,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=413/500000]
+ train/ActionL1Loss=0.1600
+ throughput/total_tokens=79,296,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=414/500000]
+ train/ActionL1Loss=0.1509
+ throughput/total_tokens=79,488,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=415/500000]
+ train/ActionL1Loss=0.1523
+ throughput/total_tokens=79,680,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=416/500000]
+ train/ActionL1Loss=0.1396
+ throughput/total_tokens=79,872,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=417/500000]
+ train/ActionL1Loss=0.1344
+ throughput/total_tokens=80,064,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=418/500000]
+ train/ActionL1Loss=0.1567
+ throughput/total_tokens=80,256,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=419/500000]
+ train/ActionL1Loss=0.1468
+ throughput/total_tokens=80,448,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=420/500000]
+ optim/total_grad_norm=19.84
+ train/ActionL1Loss=0.1695
+ throughput/total_tokens=80,640,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=421/500000]
+ train/ActionL1Loss=0.1524
+ throughput/total_tokens=80,832,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=422/500000]
+ train/ActionL1Loss=0.1226
+ throughput/total_tokens=81,024,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=423/500000]
+ train/ActionL1Loss=0.1410
+ throughput/total_tokens=81,216,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=424/500000]
+ train/ActionL1Loss=0.1212
+ throughput/total_tokens=81,408,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=425/500000]
+ train/ActionL1Loss=0.1439
+ throughput/total_tokens=81,600,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=426/500000]
+ train/ActionL1Loss=0.1352
+ throughput/total_tokens=81,792,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=427/500000]
+ train/ActionL1Loss=0.1319
+ throughput/total_tokens=81,984,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=428/500000]
+ train/ActionL1Loss=0.1517
+ throughput/total_tokens=82,176,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=429/500000]
+ train/ActionL1Loss=0.1345
+ throughput/total_tokens=82,368,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=430/500000]
+ train/ActionL1Loss=0.1273
+ throughput/total_tokens=82,560,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=431/500000]
+ train/ActionL1Loss=0.1346
+ throughput/total_tokens=82,752,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=432/500000]
+ train/ActionL1Loss=0.1262
+ throughput/total_tokens=82,944,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=433/500000]
+ train/ActionL1Loss=0.1413
+ throughput/total_tokens=83,136,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=434/500000]
+ train/ActionL1Loss=0.1305
+ throughput/total_tokens=83,328,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=435/500000]
+ train/ActionL1Loss=0.1241
+ throughput/total_tokens=83,520,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=436/500000]
+ train/ActionL1Loss=0.1299
+ throughput/total_tokens=83,712,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=437/500000]
+ train/ActionL1Loss=0.1376
+ throughput/total_tokens=83,904,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=438/500000]
+ train/ActionL1Loss=0.1107
+ throughput/total_tokens=84,096,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=439/500000]
+ train/ActionL1Loss=0.1234
+ throughput/total_tokens=84,288,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=440/500000]
+ optim/total_grad_norm=15.79
+ train/ActionL1Loss=0.1329
+ throughput/total_tokens=84,480,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=441/500000]
+ train/ActionL1Loss=0.1224
+ throughput/total_tokens=84,672,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=442/500000]
+ train/ActionL1Loss=0.1325
+ throughput/total_tokens=84,864,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=443/500000]
+ train/ActionL1Loss=0.1304
+ throughput/total_tokens=85,056,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=444/500000]
+ train/ActionL1Loss=0.1429
+ throughput/total_tokens=85,248,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=445/500000]
+ train/ActionL1Loss=0.1519
+ throughput/total_tokens=85,440,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=446/500000]
+ train/ActionL1Loss=0.1577
+ throughput/total_tokens=85,632,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=447/500000]
+ train/ActionL1Loss=0.1334
+ throughput/total_tokens=85,824,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=448/500000]
+ train/ActionL1Loss=0.1163
+ throughput/total_tokens=86,016,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=449/500000]
+ train/ActionL1Loss=0.1291
+ throughput/total_tokens=86,208,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=450/500000]
+ train/ActionL1Loss=0.1222
+ throughput/total_tokens=86,400,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=451/500000]
+ train/ActionL1Loss=0.1527
+ throughput/total_tokens=86,592,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=452/500000]
+ train/ActionL1Loss=0.1450
+ throughput/total_tokens=86,784,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=453/500000]
+ train/ActionL1Loss=0.1326
+ throughput/total_tokens=86,976,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=454/500000]
+ train/ActionL1Loss=0.1348
+ throughput/total_tokens=87,168,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=455/500000]
+ train/ActionL1Loss=0.1356
+ throughput/total_tokens=87,360,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=456/500000]
+ train/ActionL1Loss=0.1540
+ throughput/total_tokens=87,552,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=457/500000]
+ train/ActionL1Loss=0.1315
+ throughput/total_tokens=87,744,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=458/500000]
+ train/ActionL1Loss=0.1298
+ throughput/total_tokens=87,936,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=459/500000]
+ train/ActionL1Loss=0.1470
+ throughput/total_tokens=88,128,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=460/500000]
+ optim/total_grad_norm=18.70
+ train/ActionL1Loss=0.1561
+ throughput/total_tokens=88,320,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+ System/Peak GPU Memory (MB)=46,917
+[step=461/500000]
+ train/ActionL1Loss=0.1340
+ throughput/total_tokens=88,512,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=462/500000]
+ train/ActionL1Loss=0.1615
+ throughput/total_tokens=88,704,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=463/500000]
+ train/ActionL1Loss=0.1331
+ throughput/total_tokens=88,896,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=464/500000]
+ train/ActionL1Loss=0.1411
+ throughput/total_tokens=89,088,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=465/500000]
+ train/ActionL1Loss=0.1383
+ throughput/total_tokens=89,280,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=466/500000]
+ train/ActionL1Loss=0.1358
+ throughput/total_tokens=89,472,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=467/500000]
+ train/ActionL1Loss=0.1343
+ throughput/total_tokens=89,664,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=468/500000]
+ train/ActionL1Loss=0.1518
+ throughput/total_tokens=89,856,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=469/500000]
+ train/ActionL1Loss=0.1565
+ throughput/total_tokens=90,048,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=470/500000]
+ train/ActionL1Loss=0.1324
+ throughput/total_tokens=90,240,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=471/500000]
+ train/ActionL1Loss=0.1470
+ throughput/total_tokens=90,432,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=472/500000]
+ train/ActionL1Loss=0.1375
+ throughput/total_tokens=90,624,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=473/500000]
+ train/ActionL1Loss=0.1543
+ throughput/total_tokens=90,816,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=474/500000]
+ train/ActionL1Loss=0.1885
+ throughput/total_tokens=91,008,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=475/500000]
+ train/ActionL1Loss=0.1503
+ throughput/total_tokens=91,200,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=476/500000]
+ train/ActionL1Loss=0.1367
+ throughput/total_tokens=91,392,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=477/500000]
+ train/ActionL1Loss=0.1445
+ throughput/total_tokens=91,584,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=478/500000]
+ train/ActionL1Loss=0.1579
+ throughput/total_tokens=91,776,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=479/500000]
+ train/ActionL1Loss=0.1227
+ throughput/total_tokens=91,968,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=480/500000]
+ optim/total_grad_norm=16.09
+ train/ActionL1Loss=0.1228
+ throughput/total_tokens=92,160,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=481/500000]
+ train/ActionL1Loss=0.1405
+ throughput/total_tokens=92,352,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=482/500000]
+ train/ActionL1Loss=0.1512
+ throughput/total_tokens=92,544,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=483/500000]
+ train/ActionL1Loss=0.1600
+ throughput/total_tokens=92,736,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=484/500000]
+ train/ActionL1Loss=0.1209
+ throughput/total_tokens=92,928,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=485/500000]
+ train/ActionL1Loss=0.1550
+ throughput/total_tokens=93,120,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=486/500000]
+ train/ActionL1Loss=0.1126
+ throughput/total_tokens=93,312,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=487/500000]
+ train/ActionL1Loss=0.1264
+ throughput/total_tokens=93,504,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=488/500000]
+ train/ActionL1Loss=0.1221
+ throughput/total_tokens=93,696,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=489/500000]
+ train/ActionL1Loss=0.1483
+ throughput/total_tokens=93,888,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=490/500000]
+ train/ActionL1Loss=0.1242
+ throughput/total_tokens=94,080,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=491/500000]
+ train/ActionL1Loss=0.1495
+ throughput/total_tokens=94,272,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=492/500000]
+ train/ActionL1Loss=0.1325
+ throughput/total_tokens=94,464,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=493/500000]
+ train/ActionL1Loss=0.1283
+ throughput/total_tokens=94,656,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=494/500000]
+ train/ActionL1Loss=0.1364
+ throughput/total_tokens=94,848,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=495/500000]
+ train/ActionL1Loss=0.1137
+ throughput/total_tokens=95,040,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=496/500000]
+ train/ActionL1Loss=0.1229
+ throughput/total_tokens=95,232,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=497/500000]
+ train/ActionL1Loss=0.1226
+ throughput/total_tokens=95,424,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=498/500000]
+ train/ActionL1Loss=0.1268
+ throughput/total_tokens=95,616,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=499/500000]
+ train/ActionL1Loss=0.1479
+ throughput/total_tokens=95,808,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=500/500000]
+ optim/total_grad_norm=16.53
+ train/ActionL1Loss=0.1460
+ throughput/total_tokens=96,000,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+10/02 [19:28:36] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/fully_sharded_data_parallel.py:678: warnings.py:109
+ FutureWarning: FSDP.state_dict_type() and FSDP.set_state_dict_type() are being deprecated. Please use APIs, get_state_dict() and
+ set_state_dict(), which can support different parallelisms, FSDP1, FSDP2, DDP. API doc:
+ https://pytorch.org/docs/stable/distributed.checkpoint.html#torch.distributed.checkpoint.state_dict.get_state_dict .Tutorial:
+ https://pytorch.org/tutorials/recipes/distributed_checkpoint_recipe.html .
+ warnings.warn(
+
+ WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:860: UserWarning: warnings.py:109
+ `_get_pg_default_device` will be deprecated, it only stays for backward-compatiblity reason. If you need to find a device for object
+ collectives, please use `_get_object_coll_device`. If you need to query the device types supported by group, please use
+ `_device_capability(group)`.
+ warnings.warn(
+
+10/02 [19:28:39] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:722: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ local_shape = tensor.shape
+
+ WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:739: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ tensor.shape,
+
+ WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:741: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ tensor.dtype,
+
+10/02 [19:28:43] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/overrides.py:1747: FutureWarning: Please use DTensor warnings.py:109
+ instead and we are deprecating ShardedTensor.
+ result = torch_func_method(public_api, types, args, kwargs)
+
+10/02 [19:29:11] INFO | >> Saving config... checkpoint.py:608
+10/02 [19:29:42] INFO | >> Saving model state... checkpoint.py:796
+10/02 [19:30:56] INFO | >> Saving optim state... checkpoint.py:811
+10/02 [19:32:27] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=501/500000]
+ train/ActionL1Loss=0.1257
+ throughput/total_tokens=96,192,000
+ throughput/device/tokens_per_second=1,219
+ throughput/device/batches_per_second=0.0508
+[step=502/500000]
+ train/ActionL1Loss=0.1221
+ throughput/total_tokens=96,384,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=503/500000]
+ train/ActionL1Loss=0.1603
+ throughput/total_tokens=96,576,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=504/500000]
+ train/ActionL1Loss=0.1755
+ throughput/total_tokens=96,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=505/500000]
+ train/ActionL1Loss=0.1496
+ throughput/total_tokens=96,960,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=506/500000]
+ train/ActionL1Loss=0.1512
+ throughput/total_tokens=97,152,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=507/500000]
+ train/ActionL1Loss=0.1232
+ throughput/total_tokens=97,344,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0487
+[step=508/500000]
+ train/ActionL1Loss=0.1525
+ throughput/total_tokens=97,536,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=509/500000]
+ train/ActionL1Loss=0.1239
+ throughput/total_tokens=97,728,000
+ throughput/device/tokens_per_second=1,171
+ throughput/device/batches_per_second=0.0488
+[step=510/500000]
+ train/ActionL1Loss=0.1419
+ throughput/total_tokens=97,920,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+ System/Peak GPU Memory (MB)=46,917
+[step=511/500000]
+ train/ActionL1Loss=0.1361
+ throughput/total_tokens=98,112,000
+ throughput/device/tokens_per_second=1,174
+ throughput/device/batches_per_second=0.0489
+[step=512/500000]
+ train/ActionL1Loss=0.1485
+ throughput/total_tokens=98,304,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=513/500000]
+ train/ActionL1Loss=0.1396
+ throughput/total_tokens=98,496,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=514/500000]
+ train/ActionL1Loss=0.1383
+ throughput/total_tokens=98,688,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=515/500000]
+ train/ActionL1Loss=0.1242
+ throughput/total_tokens=98,880,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=516/500000]
+ train/ActionL1Loss=0.1339
+ throughput/total_tokens=99,072,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0491
+[step=517/500000]
+ train/ActionL1Loss=0.1476
+ throughput/total_tokens=99,264,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0491
+[step=518/500000]
+ train/ActionL1Loss=0.1534
+ throughput/total_tokens=99,456,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=519/500000]
+ train/ActionL1Loss=0.1332
+ throughput/total_tokens=99,648,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=520/500000]
+ optim/total_grad_norm=17.21
+ train/ActionL1Loss=0.1278
+ throughput/total_tokens=99,840,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+ System/Peak GPU Memory (MB)=46,917
+[step=521/500000]
+ train/ActionL1Loss=0.1541
+ throughput/total_tokens=100,032,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=522/500000]
+ train/ActionL1Loss=0.1415
+ throughput/total_tokens=100,224,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=523/500000]
+ train/ActionL1Loss=0.1399
+ throughput/total_tokens=100,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=524/500000]
+ train/ActionL1Loss=0.1330
+ throughput/total_tokens=100,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=525/500000]
+ train/ActionL1Loss=0.1521
+ throughput/total_tokens=100,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=526/500000]
+ train/ActionL1Loss=0.1821
+ throughput/total_tokens=100,992,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=527/500000]
+ train/ActionL1Loss=0.1325
+ throughput/total_tokens=101,184,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=528/500000]
+ train/ActionL1Loss=0.1408
+ throughput/total_tokens=101,376,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=529/500000]
+ train/ActionL1Loss=0.1500
+ throughput/total_tokens=101,568,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=530/500000]
+ train/ActionL1Loss=0.1500
+ throughput/total_tokens=101,760,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=531/500000]
+ train/ActionL1Loss=0.1162
+ throughput/total_tokens=101,952,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=532/500000]
+ train/ActionL1Loss=0.1229
+ throughput/total_tokens=102,144,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=533/500000]
+ train/ActionL1Loss=0.1143
+ throughput/total_tokens=102,336,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=534/500000]
+ train/ActionL1Loss=0.1529
+ throughput/total_tokens=102,528,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=535/500000]
+ train/ActionL1Loss=0.1234
+ throughput/total_tokens=102,720,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=536/500000]
+ train/ActionL1Loss=0.1788
+ throughput/total_tokens=102,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=537/500000]
+ train/ActionL1Loss=0.1368
+ throughput/total_tokens=103,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=538/500000]
+ train/ActionL1Loss=0.1414
+ throughput/total_tokens=103,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=539/500000]
+ train/ActionL1Loss=0.1474
+ throughput/total_tokens=103,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=540/500000]
+ optim/total_grad_norm=16.17
+ train/ActionL1Loss=0.1374
+ throughput/total_tokens=103,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=541/500000]
+ train/ActionL1Loss=0.1425
+ throughput/total_tokens=103,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=542/500000]
+ train/ActionL1Loss=0.1513
+ throughput/total_tokens=104,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=543/500000]
+ train/ActionL1Loss=0.1404
+ throughput/total_tokens=104,256,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=544/500000]
+ train/ActionL1Loss=0.1234
+ throughput/total_tokens=104,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=545/500000]
+ train/ActionL1Loss=0.1348
+ throughput/total_tokens=104,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=546/500000]
+ train/ActionL1Loss=0.1458
+ throughput/total_tokens=104,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=547/500000]
+ train/ActionL1Loss=0.1447
+ throughput/total_tokens=105,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=548/500000]
+ train/ActionL1Loss=0.1217
+ throughput/total_tokens=105,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=549/500000]
+ train/ActionL1Loss=0.1170
+ throughput/total_tokens=105,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=550/500000]
+ train/ActionL1Loss=0.1297
+ throughput/total_tokens=105,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=551/500000]
+ train/ActionL1Loss=0.1227
+ throughput/total_tokens=105,792,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=552/500000]
+ train/ActionL1Loss=0.1307
+ throughput/total_tokens=105,984,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=553/500000]
+ train/ActionL1Loss=0.1298
+ throughput/total_tokens=106,176,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=554/500000]
+ train/ActionL1Loss=0.1714
+ throughput/total_tokens=106,368,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=555/500000]
+ train/ActionL1Loss=0.1533
+ throughput/total_tokens=106,560,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=556/500000]
+ train/ActionL1Loss=0.1369
+ throughput/total_tokens=106,752,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=557/500000]
+ train/ActionL1Loss=0.1289
+ throughput/total_tokens=106,944,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=558/500000]
+ train/ActionL1Loss=0.1280
+ throughput/total_tokens=107,136,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=559/500000]
+ train/ActionL1Loss=0.1382
+ throughput/total_tokens=107,328,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=560/500000]
+ optim/total_grad_norm=15.57
+ train/ActionL1Loss=0.1503
+ throughput/total_tokens=107,520,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=561/500000]
+ train/ActionL1Loss=0.1216
+ throughput/total_tokens=107,712,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=562/500000]
+ train/ActionL1Loss=0.1180
+ throughput/total_tokens=107,904,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=563/500000]
+ train/ActionL1Loss=0.1344
+ throughput/total_tokens=108,096,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=564/500000]
+ train/ActionL1Loss=0.1453
+ throughput/total_tokens=108,288,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=565/500000]
+ train/ActionL1Loss=0.1295
+ throughput/total_tokens=108,480,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=566/500000]
+ train/ActionL1Loss=0.1323
+ throughput/total_tokens=108,672,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=567/500000]
+ train/ActionL1Loss=0.1703
+ throughput/total_tokens=108,864,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=568/500000]
+ train/ActionL1Loss=0.1089
+ throughput/total_tokens=109,056,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=569/500000]
+ train/ActionL1Loss=0.1274
+ throughput/total_tokens=109,248,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=570/500000]
+ train/ActionL1Loss=0.1319
+ throughput/total_tokens=109,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=571/500000]
+ train/ActionL1Loss=0.1223
+ throughput/total_tokens=109,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=572/500000]
+ train/ActionL1Loss=0.1265
+ throughput/total_tokens=109,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=573/500000]
+ train/ActionL1Loss=0.1243
+ throughput/total_tokens=110,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=574/500000]
+ train/ActionL1Loss=0.1417
+ throughput/total_tokens=110,208,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=575/500000]
+ train/ActionL1Loss=0.1208
+ throughput/total_tokens=110,400,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=576/500000]
+ train/ActionL1Loss=0.1443
+ throughput/total_tokens=110,592,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=577/500000]
+ train/ActionL1Loss=0.1365
+ throughput/total_tokens=110,784,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=578/500000]
+ train/ActionL1Loss=0.1656
+ throughput/total_tokens=110,976,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=579/500000]
+ train/ActionL1Loss=0.1367
+ throughput/total_tokens=111,168,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=580/500000]
+ optim/total_grad_norm=17.43
+ train/ActionL1Loss=0.1682
+ throughput/total_tokens=111,360,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=581/500000]
+ train/ActionL1Loss=0.1345
+ throughput/total_tokens=111,552,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=582/500000]
+ train/ActionL1Loss=0.1527
+ throughput/total_tokens=111,744,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=583/500000]
+ train/ActionL1Loss=0.1561
+ throughput/total_tokens=111,936,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=584/500000]
+ train/ActionL1Loss=0.1267
+ throughput/total_tokens=112,128,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=585/500000]
+ train/ActionL1Loss=0.1488
+ throughput/total_tokens=112,320,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=586/500000]
+ train/ActionL1Loss=0.1325
+ throughput/total_tokens=112,512,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=587/500000]
+ train/ActionL1Loss=0.1260
+ throughput/total_tokens=112,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=588/500000]
+ train/ActionL1Loss=0.1571
+ throughput/total_tokens=112,896,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=589/500000]
+ train/ActionL1Loss=0.1273
+ throughput/total_tokens=113,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=590/500000]
+ train/ActionL1Loss=0.1447
+ throughput/total_tokens=113,280,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=591/500000]
+ train/ActionL1Loss=0.1366
+ throughput/total_tokens=113,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=592/500000]
+ train/ActionL1Loss=0.1478
+ throughput/total_tokens=113,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=593/500000]
+ train/ActionL1Loss=0.1542
+ throughput/total_tokens=113,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=594/500000]
+ train/ActionL1Loss=0.1221
+ throughput/total_tokens=114,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=595/500000]
+ train/ActionL1Loss=0.1390
+ throughput/total_tokens=114,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=596/500000]
+ train/ActionL1Loss=0.1554
+ throughput/total_tokens=114,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=597/500000]
+ train/ActionL1Loss=0.1366
+ throughput/total_tokens=114,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=598/500000]
+ train/ActionL1Loss=0.1228
+ throughput/total_tokens=114,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=599/500000]
+ train/ActionL1Loss=0.1290
+ throughput/total_tokens=115,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=600/500000]
+ optim/total_grad_norm=12.86
+ train/ActionL1Loss=0.1194
+ throughput/total_tokens=115,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=601/500000]
+ train/ActionL1Loss=0.1409
+ throughput/total_tokens=115,392,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=602/500000]
+ train/ActionL1Loss=0.1287
+ throughput/total_tokens=115,584,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=603/500000]
+ train/ActionL1Loss=0.1244
+ throughput/total_tokens=115,776,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=604/500000]
+ train/ActionL1Loss=0.1237
+ throughput/total_tokens=115,968,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=605/500000]
+ train/ActionL1Loss=0.1323
+ throughput/total_tokens=116,160,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=606/500000]
+ train/ActionL1Loss=0.1178
+ throughput/total_tokens=116,352,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=607/500000]
+ train/ActionL1Loss=0.1148
+ throughput/total_tokens=116,544,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=608/500000]
+ train/ActionL1Loss=0.1420
+ throughput/total_tokens=116,736,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=609/500000]
+ train/ActionL1Loss=0.1428
+ throughput/total_tokens=116,928,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=610/500000]
+ train/ActionL1Loss=0.1206
+ throughput/total_tokens=117,120,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=611/500000]
+ train/ActionL1Loss=0.1550
+ throughput/total_tokens=117,312,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=612/500000]
+ train/ActionL1Loss=0.1342
+ throughput/total_tokens=117,504,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=613/500000]
+ train/ActionL1Loss=0.1180
+ throughput/total_tokens=117,696,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=614/500000]
+ train/ActionL1Loss=0.1531
+ throughput/total_tokens=117,888,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=615/500000]
+ train/ActionL1Loss=0.1559
+ throughput/total_tokens=118,080,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=616/500000]
+ train/ActionL1Loss=0.1192
+ throughput/total_tokens=118,272,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=617/500000]
+ train/ActionL1Loss=0.1160
+ throughput/total_tokens=118,464,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=618/500000]
+ train/ActionL1Loss=0.1273
+ throughput/total_tokens=118,656,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=619/500000]
+ train/ActionL1Loss=0.1516
+ throughput/total_tokens=118,848,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=620/500000]
+ optim/total_grad_norm=15.81
+ train/ActionL1Loss=0.1397
+ throughput/total_tokens=119,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=621/500000]
+ train/ActionL1Loss=0.1388
+ throughput/total_tokens=119,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=622/500000]
+ train/ActionL1Loss=0.1362
+ throughput/total_tokens=119,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=623/500000]
+ train/ActionL1Loss=0.1278
+ throughput/total_tokens=119,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=624/500000]
+ train/ActionL1Loss=0.1316
+ throughput/total_tokens=119,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=625/500000]
+ train/ActionL1Loss=0.1485
+ throughput/total_tokens=120,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=626/500000]
+ train/ActionL1Loss=0.1260
+ throughput/total_tokens=120,192,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=627/500000]
+ train/ActionL1Loss=0.1398
+ throughput/total_tokens=120,384,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=628/500000]
+ train/ActionL1Loss=0.1356
+ throughput/total_tokens=120,576,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=629/500000]
+ train/ActionL1Loss=0.1445
+ throughput/total_tokens=120,768,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=630/500000]
+ train/ActionL1Loss=0.1388
+ throughput/total_tokens=120,960,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=631/500000]
+ train/ActionL1Loss=0.1399
+ throughput/total_tokens=121,152,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=632/500000]
+ train/ActionL1Loss=0.1308
+ throughput/total_tokens=121,344,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=633/500000]
+ train/ActionL1Loss=0.1414
+ throughput/total_tokens=121,536,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=634/500000]
+ train/ActionL1Loss=0.1378
+ throughput/total_tokens=121,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=635/500000]
+ train/ActionL1Loss=0.1311
+ throughput/total_tokens=121,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=636/500000]
+ train/ActionL1Loss=0.1158
+ throughput/total_tokens=122,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=637/500000]
+ train/ActionL1Loss=0.1505
+ throughput/total_tokens=122,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=638/500000]
+ train/ActionL1Loss=0.1273
+ throughput/total_tokens=122,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=639/500000]
+ train/ActionL1Loss=0.1389
+ throughput/total_tokens=122,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=640/500000]
+ optim/total_grad_norm=16.39
+ train/ActionL1Loss=0.1349
+ throughput/total_tokens=122,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=641/500000]
+ train/ActionL1Loss=0.1395
+ throughput/total_tokens=123,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=642/500000]
+ train/ActionL1Loss=0.1222
+ throughput/total_tokens=123,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=643/500000]
+ train/ActionL1Loss=0.1466
+ throughput/total_tokens=123,456,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=644/500000]
+ train/ActionL1Loss=0.1284
+ throughput/total_tokens=123,648,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=645/500000]
+ train/ActionL1Loss=0.1145
+ throughput/total_tokens=123,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=646/500000]
+ train/ActionL1Loss=0.1341
+ throughput/total_tokens=124,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=647/500000]
+ train/ActionL1Loss=0.1354
+ throughput/total_tokens=124,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=648/500000]
+ train/ActionL1Loss=0.1336
+ throughput/total_tokens=124,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=649/500000]
+ train/ActionL1Loss=0.0948
+ throughput/total_tokens=124,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=650/500000]
+ train/ActionL1Loss=0.1321
+ throughput/total_tokens=124,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=651/500000]
+ train/ActionL1Loss=0.1401
+ throughput/total_tokens=124,992,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=652/500000]
+ train/ActionL1Loss=0.1381
+ throughput/total_tokens=125,184,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=653/500000]
+ train/ActionL1Loss=0.1298
+ throughput/total_tokens=125,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=654/500000]
+ train/ActionL1Loss=0.1401
+ throughput/total_tokens=125,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=655/500000]
+ train/ActionL1Loss=0.1237
+ throughput/total_tokens=125,760,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=656/500000]
+ train/ActionL1Loss=0.1283
+ throughput/total_tokens=125,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=657/500000]
+ train/ActionL1Loss=0.1328
+ throughput/total_tokens=126,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=658/500000]
+ train/ActionL1Loss=0.1299
+ throughput/total_tokens=126,336,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=659/500000]
+ train/ActionL1Loss=0.1398
+ throughput/total_tokens=126,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=660/500000]
+ optim/total_grad_norm=13.81
+ train/ActionL1Loss=0.1259
+ throughput/total_tokens=126,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=661/500000]
+ train/ActionL1Loss=0.1152
+ throughput/total_tokens=126,912,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=662/500000]
+ train/ActionL1Loss=0.1384
+ throughput/total_tokens=127,104,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=663/500000]
+ train/ActionL1Loss=0.1568
+ throughput/total_tokens=127,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=664/500000]
+ train/ActionL1Loss=0.1171
+ throughput/total_tokens=127,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=665/500000]
+ train/ActionL1Loss=0.1380
+ throughput/total_tokens=127,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=666/500000]
+ train/ActionL1Loss=0.1253
+ throughput/total_tokens=127,872,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=667/500000]
+ train/ActionL1Loss=0.1366
+ throughput/total_tokens=128,064,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=668/500000]
+ train/ActionL1Loss=0.0958
+ throughput/total_tokens=128,256,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=669/500000]
+ train/ActionL1Loss=0.1254
+ throughput/total_tokens=128,448,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=670/500000]
+ train/ActionL1Loss=0.1491
+ throughput/total_tokens=128,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=671/500000]
+ train/ActionL1Loss=0.1294
+ throughput/total_tokens=128,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=672/500000]
+ train/ActionL1Loss=0.1368
+ throughput/total_tokens=129,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=673/500000]
+ train/ActionL1Loss=0.1651
+ throughput/total_tokens=129,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=674/500000]
+ train/ActionL1Loss=0.1200
+ throughput/total_tokens=129,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=675/500000]
+ train/ActionL1Loss=0.1265
+ throughput/total_tokens=129,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=676/500000]
+ train/ActionL1Loss=0.1435
+ throughput/total_tokens=129,792,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=677/500000]
+ train/ActionL1Loss=0.1244
+ throughput/total_tokens=129,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=678/500000]
+ train/ActionL1Loss=0.1163
+ throughput/total_tokens=130,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=679/500000]
+ train/ActionL1Loss=0.1169
+ throughput/total_tokens=130,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=680/500000]
+ optim/total_grad_norm=13.12
+ train/ActionL1Loss=0.1136
+ throughput/total_tokens=130,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=681/500000]
+ train/ActionL1Loss=0.1220
+ throughput/total_tokens=130,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=682/500000]
+ train/ActionL1Loss=0.1196
+ throughput/total_tokens=130,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=683/500000]
+ train/ActionL1Loss=0.1556
+ throughput/total_tokens=131,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=684/500000]
+ train/ActionL1Loss=0.1485
+ throughput/total_tokens=131,328,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=685/500000]
+ train/ActionL1Loss=0.1258
+ throughput/total_tokens=131,520,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=686/500000]
+ train/ActionL1Loss=0.1236
+ throughput/total_tokens=131,712,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=687/500000]
+ train/ActionL1Loss=0.1225
+ throughput/total_tokens=131,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=688/500000]
+ train/ActionL1Loss=0.1239
+ throughput/total_tokens=132,096,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=689/500000]
+ train/ActionL1Loss=0.1361
+ throughput/total_tokens=132,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=690/500000]
+ train/ActionL1Loss=0.1290
+ throughput/total_tokens=132,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=691/500000]
+ train/ActionL1Loss=0.0972
+ throughput/total_tokens=132,672,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=692/500000]
+ train/ActionL1Loss=0.1122
+ throughput/total_tokens=132,864,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=693/500000]
+ train/ActionL1Loss=0.1597
+ throughput/total_tokens=133,056,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=694/500000]
+ train/ActionL1Loss=0.1600
+ throughput/total_tokens=133,248,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=695/500000]
+ train/ActionL1Loss=0.1123
+ throughput/total_tokens=133,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=696/500000]
+ train/ActionL1Loss=0.1203
+ throughput/total_tokens=133,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=697/500000]
+ train/ActionL1Loss=0.1589
+ throughput/total_tokens=133,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=698/500000]
+ train/ActionL1Loss=0.1176
+ throughput/total_tokens=134,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=699/500000]
+ train/ActionL1Loss=0.1154
+ throughput/total_tokens=134,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=700/500000]
+ optim/total_grad_norm=15.14
+ train/ActionL1Loss=0.1163
+ throughput/total_tokens=134,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=701/500000]
+ train/ActionL1Loss=0.1347
+ throughput/total_tokens=134,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=702/500000]
+ train/ActionL1Loss=0.1191
+ throughput/total_tokens=134,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=703/500000]
+ train/ActionL1Loss=0.1325
+ throughput/total_tokens=134,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=704/500000]
+ train/ActionL1Loss=0.1048
+ throughput/total_tokens=135,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=705/500000]
+ train/ActionL1Loss=0.1498
+ throughput/total_tokens=135,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=706/500000]
+ train/ActionL1Loss=0.1452
+ throughput/total_tokens=135,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=707/500000]
+ train/ActionL1Loss=0.1361
+ throughput/total_tokens=135,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=708/500000]
+ train/ActionL1Loss=0.1552
+ throughput/total_tokens=135,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=709/500000]
+ train/ActionL1Loss=0.2081
+ throughput/total_tokens=136,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=710/500000]
+ train/ActionL1Loss=0.1337
+ throughput/total_tokens=136,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=711/500000]
+ train/ActionL1Loss=0.1184
+ throughput/total_tokens=136,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=712/500000]
+ train/ActionL1Loss=0.1346
+ throughput/total_tokens=136,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=713/500000]
+ train/ActionL1Loss=0.1132
+ throughput/total_tokens=136,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=714/500000]
+ train/ActionL1Loss=0.1050
+ throughput/total_tokens=137,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=715/500000]
+ train/ActionL1Loss=0.0985
+ throughput/total_tokens=137,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=716/500000]
+ train/ActionL1Loss=0.1301
+ throughput/total_tokens=137,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=717/500000]
+ train/ActionL1Loss=0.1333
+ throughput/total_tokens=137,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=718/500000]
+ train/ActionL1Loss=0.1343
+ throughput/total_tokens=137,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=719/500000]
+ train/ActionL1Loss=0.1050
+ throughput/total_tokens=138,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=720/500000]
+ optim/total_grad_norm=13.82
+ train/ActionL1Loss=0.1210
+ throughput/total_tokens=138,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=721/500000]
+ train/ActionL1Loss=0.1288
+ throughput/total_tokens=138,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=722/500000]
+ train/ActionL1Loss=0.1385
+ throughput/total_tokens=138,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=723/500000]
+ train/ActionL1Loss=0.1265
+ throughput/total_tokens=138,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=724/500000]
+ train/ActionL1Loss=0.1280
+ throughput/total_tokens=139,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=725/500000]
+ train/ActionL1Loss=0.1318
+ throughput/total_tokens=139,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=726/500000]
+ train/ActionL1Loss=0.1422
+ throughput/total_tokens=139,392,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=727/500000]
+ train/ActionL1Loss=0.1164
+ throughput/total_tokens=139,584,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=728/500000]
+ train/ActionL1Loss=0.1443
+ throughput/total_tokens=139,776,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=729/500000]
+ train/ActionL1Loss=0.1256
+ throughput/total_tokens=139,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=730/500000]
+ train/ActionL1Loss=0.1124
+ throughput/total_tokens=140,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=731/500000]
+ train/ActionL1Loss=0.1150
+ throughput/total_tokens=140,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=732/500000]
+ train/ActionL1Loss=0.1421
+ throughput/total_tokens=140,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=733/500000]
+ train/ActionL1Loss=0.1446
+ throughput/total_tokens=140,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=734/500000]
+ train/ActionL1Loss=0.1286
+ throughput/total_tokens=140,928,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=735/500000]
+ train/ActionL1Loss=0.1175
+ throughput/total_tokens=141,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=736/500000]
+ train/ActionL1Loss=0.1316
+ throughput/total_tokens=141,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=737/500000]
+ train/ActionL1Loss=0.1340
+ throughput/total_tokens=141,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=738/500000]
+ train/ActionL1Loss=0.1325
+ throughput/total_tokens=141,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=739/500000]
+ train/ActionL1Loss=0.1343
+ throughput/total_tokens=141,888,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=740/500000]
+ optim/total_grad_norm=12.77
+ train/ActionL1Loss=0.1572
+ throughput/total_tokens=142,080,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=741/500000]
+ train/ActionL1Loss=0.1509
+ throughput/total_tokens=142,272,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=742/500000]
+ train/ActionL1Loss=0.1333
+ throughput/total_tokens=142,464,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=743/500000]
+ train/ActionL1Loss=0.1289
+ throughput/total_tokens=142,656,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=744/500000]
+ train/ActionL1Loss=0.1837
+ throughput/total_tokens=142,848,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=745/500000]
+ train/ActionL1Loss=0.1428
+ throughput/total_tokens=143,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=746/500000]
+ train/ActionL1Loss=0.1485
+ throughput/total_tokens=143,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=747/500000]
+ train/ActionL1Loss=0.1350
+ throughput/total_tokens=143,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=748/500000]
+ train/ActionL1Loss=0.1237
+ throughput/total_tokens=143,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=749/500000]
+ train/ActionL1Loss=0.1131
+ throughput/total_tokens=143,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=750/500000]
+ train/ActionL1Loss=0.1290
+ throughput/total_tokens=144,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=751/500000]
+ train/ActionL1Loss=0.1076
+ throughput/total_tokens=144,192,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=752/500000]
+ train/ActionL1Loss=0.1243
+ throughput/total_tokens=144,384,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=753/500000]
+ train/ActionL1Loss=0.1259
+ throughput/total_tokens=144,576,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=754/500000]
+ train/ActionL1Loss=0.1226
+ throughput/total_tokens=144,768,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=755/500000]
+ train/ActionL1Loss=0.1259
+ throughput/total_tokens=144,960,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=756/500000]
+ train/ActionL1Loss=0.1277
+ throughput/total_tokens=145,152,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=757/500000]
+ train/ActionL1Loss=0.1266
+ throughput/total_tokens=145,344,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=758/500000]
+ train/ActionL1Loss=0.1313
+ throughput/total_tokens=145,536,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=759/500000]
+ train/ActionL1Loss=0.1267
+ throughput/total_tokens=145,728,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=760/500000]
+ optim/total_grad_norm=12.64
+ train/ActionL1Loss=0.1057
+ throughput/total_tokens=145,920,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=761/500000]
+ train/ActionL1Loss=0.1338
+ throughput/total_tokens=146,112,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=762/500000]
+ train/ActionL1Loss=0.1116
+ throughput/total_tokens=146,304,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=763/500000]
+ train/ActionL1Loss=0.1215
+ throughput/total_tokens=146,496,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=764/500000]
+ train/ActionL1Loss=0.1392
+ throughput/total_tokens=146,688,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=765/500000]
+ train/ActionL1Loss=0.1081
+ throughput/total_tokens=146,880,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=766/500000]
+ train/ActionL1Loss=0.1150
+ throughput/total_tokens=147,072,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=767/500000]
+ train/ActionL1Loss=0.1220
+ throughput/total_tokens=147,264,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=768/500000]
+ train/ActionL1Loss=0.1106
+ throughput/total_tokens=147,456,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=769/500000]
+ train/ActionL1Loss=0.1158
+ throughput/total_tokens=147,648,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=770/500000]
+ train/ActionL1Loss=0.1250
+ throughput/total_tokens=147,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=771/500000]
+ train/ActionL1Loss=0.1018
+ throughput/total_tokens=148,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=772/500000]
+ train/ActionL1Loss=0.1060
+ throughput/total_tokens=148,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=773/500000]
+ train/ActionL1Loss=0.1021
+ throughput/total_tokens=148,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=774/500000]
+ train/ActionL1Loss=0.0958
+ throughput/total_tokens=148,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=775/500000]
+ train/ActionL1Loss=0.1088
+ throughput/total_tokens=148,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=776/500000]
+ train/ActionL1Loss=0.1063
+ throughput/total_tokens=148,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=777/500000]
+ train/ActionL1Loss=0.0835
+ throughput/total_tokens=149,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=778/500000]
+ train/ActionL1Loss=0.1127
+ throughput/total_tokens=149,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=779/500000]
+ train/ActionL1Loss=0.1090
+ throughput/total_tokens=149,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=780/500000]
+ optim/total_grad_norm=10.79
+ train/ActionL1Loss=0.0907
+ throughput/total_tokens=149,760,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=781/500000]
+ train/ActionL1Loss=0.1088
+ throughput/total_tokens=149,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=782/500000]
+ train/ActionL1Loss=0.1158
+ throughput/total_tokens=150,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=783/500000]
+ train/ActionL1Loss=0.1149
+ throughput/total_tokens=150,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=784/500000]
+ train/ActionL1Loss=0.1197
+ throughput/total_tokens=150,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=785/500000]
+ train/ActionL1Loss=0.1247
+ throughput/total_tokens=150,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=786/500000]
+ train/ActionL1Loss=0.1430
+ throughput/total_tokens=150,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=787/500000]
+ train/ActionL1Loss=0.1276
+ throughput/total_tokens=151,104,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=788/500000]
+ train/ActionL1Loss=0.1008
+ throughput/total_tokens=151,296,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=789/500000]
+ train/ActionL1Loss=0.1301
+ throughput/total_tokens=151,488,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=790/500000]
+ train/ActionL1Loss=0.1090
+ throughput/total_tokens=151,680,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=791/500000]
+ train/ActionL1Loss=0.1399
+ throughput/total_tokens=151,872,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=792/500000]
+ train/ActionL1Loss=0.1168
+ throughput/total_tokens=152,064,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=793/500000]
+ train/ActionL1Loss=0.1203
+ throughput/total_tokens=152,256,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=794/500000]
+ train/ActionL1Loss=0.1315
+ throughput/total_tokens=152,448,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=795/500000]
+ train/ActionL1Loss=0.1087
+ throughput/total_tokens=152,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=796/500000]
+ train/ActionL1Loss=0.1038
+ throughput/total_tokens=152,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=797/500000]
+ train/ActionL1Loss=0.1157
+ throughput/total_tokens=153,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=798/500000]
+ train/ActionL1Loss=0.1032
+ throughput/total_tokens=153,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=799/500000]
+ train/ActionL1Loss=0.1121
+ throughput/total_tokens=153,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=800/500000]
+ optim/total_grad_norm=11.14
+ train/ActionL1Loss=0.1309
+ throughput/total_tokens=153,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=801/500000]
+ train/ActionL1Loss=0.1155
+ throughput/total_tokens=153,792,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=802/500000]
+ train/ActionL1Loss=0.1271
+ throughput/total_tokens=153,984,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=803/500000]
+ train/ActionL1Loss=0.1301
+ throughput/total_tokens=154,176,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=804/500000]
+ train/ActionL1Loss=0.1089
+ throughput/total_tokens=154,368,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=805/500000]
+ train/ActionL1Loss=0.1403
+ throughput/total_tokens=154,560,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=806/500000]
+ train/ActionL1Loss=0.1309
+ throughput/total_tokens=154,752,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=807/500000]
+ train/ActionL1Loss=0.1121
+ throughput/total_tokens=154,944,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=808/500000]
+ train/ActionL1Loss=0.1275
+ throughput/total_tokens=155,136,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=809/500000]
+ train/ActionL1Loss=0.1290
+ throughput/total_tokens=155,328,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=810/500000]
+ train/ActionL1Loss=0.1122
+ throughput/total_tokens=155,520,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=811/500000]
+ train/ActionL1Loss=0.1098
+ throughput/total_tokens=155,712,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=812/500000]
+ train/ActionL1Loss=0.1099
+ throughput/total_tokens=155,904,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=813/500000]
+ train/ActionL1Loss=0.1100
+ throughput/total_tokens=156,096,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=814/500000]
+ train/ActionL1Loss=0.1163
+ throughput/total_tokens=156,288,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=815/500000]
+ train/ActionL1Loss=0.1336
+ throughput/total_tokens=156,480,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=816/500000]
+ train/ActionL1Loss=0.1113
+ throughput/total_tokens=156,672,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=817/500000]
+ train/ActionL1Loss=0.1270
+ throughput/total_tokens=156,864,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=818/500000]
+ train/ActionL1Loss=0.0995
+ throughput/total_tokens=157,056,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=819/500000]
+ train/ActionL1Loss=0.1196
+ throughput/total_tokens=157,248,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=820/500000]
+ optim/total_grad_norm=13.42
+ train/ActionL1Loss=0.1093
+ throughput/total_tokens=157,440,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=821/500000]
+ train/ActionL1Loss=0.1259
+ throughput/total_tokens=157,632,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=822/500000]
+ train/ActionL1Loss=0.1362
+ throughput/total_tokens=157,824,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=823/500000]
+ train/ActionL1Loss=0.1222
+ throughput/total_tokens=158,016,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=824/500000]
+ train/ActionL1Loss=0.1279
+ throughput/total_tokens=158,208,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=825/500000]
+ train/ActionL1Loss=0.1153
+ throughput/total_tokens=158,400,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=826/500000]
+ train/ActionL1Loss=0.1361
+ throughput/total_tokens=158,592,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=827/500000]
+ train/ActionL1Loss=0.1374
+ throughput/total_tokens=158,784,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=828/500000]
+ train/ActionL1Loss=0.1105
+ throughput/total_tokens=158,976,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=829/500000]
+ train/ActionL1Loss=0.1207
+ throughput/total_tokens=159,168,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=830/500000]
+ train/ActionL1Loss=0.1459
+ throughput/total_tokens=159,360,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=831/500000]
+ train/ActionL1Loss=0.1234
+ throughput/total_tokens=159,552,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=832/500000]
+ train/ActionL1Loss=0.1340
+ throughput/total_tokens=159,744,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=833/500000]
+ train/ActionL1Loss=0.1313
+ throughput/total_tokens=159,936,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=834/500000]
+ train/ActionL1Loss=0.1259
+ throughput/total_tokens=160,128,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=835/500000]
+ train/ActionL1Loss=0.1350
+ throughput/total_tokens=160,320,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=836/500000]
+ train/ActionL1Loss=0.1081
+ throughput/total_tokens=160,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=837/500000]
+ train/ActionL1Loss=0.1209
+ throughput/total_tokens=160,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=838/500000]
+ train/ActionL1Loss=0.1502
+ throughput/total_tokens=160,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=839/500000]
+ train/ActionL1Loss=0.1401
+ throughput/total_tokens=161,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=840/500000]
+ optim/total_grad_norm=12.32
+ train/ActionL1Loss=0.1187
+ throughput/total_tokens=161,280,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=841/500000]
+ train/ActionL1Loss=0.1271
+ throughput/total_tokens=161,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=842/500000]
+ train/ActionL1Loss=0.1332
+ throughput/total_tokens=161,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=843/500000]
+ train/ActionL1Loss=0.1520
+ throughput/total_tokens=161,856,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=844/500000]
+ train/ActionL1Loss=0.1132
+ throughput/total_tokens=162,048,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=845/500000]
+ train/ActionL1Loss=0.1240
+ throughput/total_tokens=162,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=846/500000]
+ train/ActionL1Loss=0.1365
+ throughput/total_tokens=162,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=847/500000]
+ train/ActionL1Loss=0.1352
+ throughput/total_tokens=162,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=848/500000]
+ train/ActionL1Loss=0.1258
+ throughput/total_tokens=162,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=849/500000]
+ train/ActionL1Loss=0.1257
+ throughput/total_tokens=163,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=850/500000]
+ train/ActionL1Loss=0.1297
+ throughput/total_tokens=163,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=851/500000]
+ train/ActionL1Loss=0.1164
+ throughput/total_tokens=163,392,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=852/500000]
+ train/ActionL1Loss=0.1129
+ throughput/total_tokens=163,584,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=853/500000]
+ train/ActionL1Loss=0.1041
+ throughput/total_tokens=163,776,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=854/500000]
+ train/ActionL1Loss=0.1184
+ throughput/total_tokens=163,968,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=855/500000]
+ train/ActionL1Loss=0.0962
+ throughput/total_tokens=164,160,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=856/500000]
+ train/ActionL1Loss=0.1037
+ throughput/total_tokens=164,352,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=857/500000]
+ train/ActionL1Loss=0.1062
+ throughput/total_tokens=164,544,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=858/500000]
+ train/ActionL1Loss=0.1274
+ throughput/total_tokens=164,736,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=859/500000]
+ train/ActionL1Loss=0.1142
+ throughput/total_tokens=164,928,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=860/500000]
+ optim/total_grad_norm=13.90
+ train/ActionL1Loss=0.1150
+ throughput/total_tokens=165,120,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=861/500000]
+ train/ActionL1Loss=0.0988
+ throughput/total_tokens=165,312,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=862/500000]
+ train/ActionL1Loss=0.1111
+ throughput/total_tokens=165,504,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=863/500000]
+ train/ActionL1Loss=0.1173
+ throughput/total_tokens=165,696,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=864/500000]
+ train/ActionL1Loss=0.1387
+ throughput/total_tokens=165,888,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=865/500000]
+ train/ActionL1Loss=0.0985
+ throughput/total_tokens=166,080,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=866/500000]
+ train/ActionL1Loss=0.1169
+ throughput/total_tokens=166,272,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=867/500000]
+ train/ActionL1Loss=0.1167
+ throughput/total_tokens=166,464,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=868/500000]
+ train/ActionL1Loss=0.1164
+ throughput/total_tokens=166,656,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=869/500000]
+ train/ActionL1Loss=0.1051
+ throughput/total_tokens=166,848,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=870/500000]
+ train/ActionL1Loss=0.0987
+ throughput/total_tokens=167,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=871/500000]
+ train/ActionL1Loss=0.1445
+ throughput/total_tokens=167,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=872/500000]
+ train/ActionL1Loss=0.1221
+ throughput/total_tokens=167,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=873/500000]
+ train/ActionL1Loss=0.1224
+ throughput/total_tokens=167,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=874/500000]
+ train/ActionL1Loss=0.1046
+ throughput/total_tokens=167,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=875/500000]
+ train/ActionL1Loss=0.1073
+ throughput/total_tokens=168,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=876/500000]
+ train/ActionL1Loss=0.1134
+ throughput/total_tokens=168,192,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=877/500000]
+ train/ActionL1Loss=0.1208
+ throughput/total_tokens=168,384,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=878/500000]
+ train/ActionL1Loss=0.1219
+ throughput/total_tokens=168,576,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=879/500000]
+ train/ActionL1Loss=0.1312
+ throughput/total_tokens=168,768,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=880/500000]
+ optim/total_grad_norm=12.74
+ train/ActionL1Loss=0.1245
+ throughput/total_tokens=168,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=881/500000]
+ train/ActionL1Loss=0.1143
+ throughput/total_tokens=169,152,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=882/500000]
+ train/ActionL1Loss=0.1219
+ throughput/total_tokens=169,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=883/500000]
+ train/ActionL1Loss=0.0965
+ throughput/total_tokens=169,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=884/500000]
+ train/ActionL1Loss=0.0980
+ throughput/total_tokens=169,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=885/500000]
+ train/ActionL1Loss=0.1155
+ throughput/total_tokens=169,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=886/500000]
+ train/ActionL1Loss=0.1008
+ throughput/total_tokens=170,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=887/500000]
+ train/ActionL1Loss=0.1204
+ throughput/total_tokens=170,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=888/500000]
+ train/ActionL1Loss=0.1303
+ throughput/total_tokens=170,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=889/500000]
+ train/ActionL1Loss=0.1280
+ throughput/total_tokens=170,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=890/500000]
+ train/ActionL1Loss=0.1198
+ throughput/total_tokens=170,880,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=891/500000]
+ train/ActionL1Loss=0.1362
+ throughput/total_tokens=171,072,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=892/500000]
+ train/ActionL1Loss=0.1322
+ throughput/total_tokens=171,264,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=893/500000]
+ train/ActionL1Loss=0.1124
+ throughput/total_tokens=171,456,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=894/500000]
+ train/ActionL1Loss=0.1084
+ throughput/total_tokens=171,648,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=895/500000]
+ train/ActionL1Loss=0.1067
+ throughput/total_tokens=171,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=896/500000]
+ train/ActionL1Loss=0.1292
+ throughput/total_tokens=172,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=897/500000]
+ train/ActionL1Loss=0.1009
+ throughput/total_tokens=172,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=898/500000]
+ train/ActionL1Loss=0.1191
+ throughput/total_tokens=172,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=899/500000]
+ train/ActionL1Loss=0.1156
+ throughput/total_tokens=172,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=900/500000]
+ optim/total_grad_norm=12.68
+ train/ActionL1Loss=0.1223
+ throughput/total_tokens=172,800,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=901/500000]
+ train/ActionL1Loss=0.1072
+ throughput/total_tokens=172,992,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=902/500000]
+ train/ActionL1Loss=0.1222
+ throughput/total_tokens=173,184,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=903/500000]
+ train/ActionL1Loss=0.1276
+ throughput/total_tokens=173,376,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=904/500000]
+ train/ActionL1Loss=0.1030
+ throughput/total_tokens=173,568,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=905/500000]
+ train/ActionL1Loss=0.1210
+ throughput/total_tokens=173,760,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=906/500000]
+ train/ActionL1Loss=0.1018
+ throughput/total_tokens=173,952,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=907/500000]
+ train/ActionL1Loss=0.1259
+ throughput/total_tokens=174,144,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=908/500000]
+ train/ActionL1Loss=0.1948
+ throughput/total_tokens=174,336,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=909/500000]
+ train/ActionL1Loss=0.1180
+ throughput/total_tokens=174,528,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=910/500000]
+ train/ActionL1Loss=0.1626
+ throughput/total_tokens=174,720,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=911/500000]
+ train/ActionL1Loss=0.1169
+ throughput/total_tokens=174,912,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=912/500000]
+ train/ActionL1Loss=0.1375
+ throughput/total_tokens=175,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=913/500000]
+ train/ActionL1Loss=0.1378
+ throughput/total_tokens=175,296,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=914/500000]
+ train/ActionL1Loss=0.1564
+ throughput/total_tokens=175,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=915/500000]
+ train/ActionL1Loss=0.1422
+ throughput/total_tokens=175,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=916/500000]
+ train/ActionL1Loss=0.1281
+ throughput/total_tokens=175,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=917/500000]
+ train/ActionL1Loss=0.1345
+ throughput/total_tokens=176,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=918/500000]
+ train/ActionL1Loss=0.1248
+ throughput/total_tokens=176,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=919/500000]
+ train/ActionL1Loss=0.1216
+ throughput/total_tokens=176,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=920/500000]
+ optim/total_grad_norm=12.36
+ train/ActionL1Loss=0.1258
+ throughput/total_tokens=176,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=921/500000]
+ train/ActionL1Loss=0.1220
+ throughput/total_tokens=176,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=922/500000]
+ train/ActionL1Loss=0.1217
+ throughput/total_tokens=177,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=923/500000]
+ train/ActionL1Loss=0.1041
+ throughput/total_tokens=177,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=924/500000]
+ train/ActionL1Loss=0.1365
+ throughput/total_tokens=177,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=925/500000]
+ train/ActionL1Loss=0.1317
+ throughput/total_tokens=177,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=926/500000]
+ train/ActionL1Loss=0.1278
+ throughput/total_tokens=177,792,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=927/500000]
+ train/ActionL1Loss=0.1177
+ throughput/total_tokens=177,984,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=928/500000]
+ train/ActionL1Loss=0.1164
+ throughput/total_tokens=178,176,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=929/500000]
+ train/ActionL1Loss=0.1149
+ throughput/total_tokens=178,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=930/500000]
+ train/ActionL1Loss=0.1023
+ throughput/total_tokens=178,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=931/500000]
+ train/ActionL1Loss=0.1223
+ throughput/total_tokens=178,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=932/500000]
+ train/ActionL1Loss=0.1430
+ throughput/total_tokens=178,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=933/500000]
+ train/ActionL1Loss=0.1397
+ throughput/total_tokens=179,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=934/500000]
+ train/ActionL1Loss=0.1273
+ throughput/total_tokens=179,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=935/500000]
+ train/ActionL1Loss=0.1023
+ throughput/total_tokens=179,520,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=936/500000]
+ train/ActionL1Loss=0.1208
+ throughput/total_tokens=179,712,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=937/500000]
+ train/ActionL1Loss=0.1206
+ throughput/total_tokens=179,904,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=938/500000]
+ train/ActionL1Loss=0.1010
+ throughput/total_tokens=180,096,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=939/500000]
+ train/ActionL1Loss=0.1330
+ throughput/total_tokens=180,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=940/500000]
+ optim/total_grad_norm=11.93
+ train/ActionL1Loss=0.1023
+ throughput/total_tokens=180,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=941/500000]
+ train/ActionL1Loss=0.1269
+ throughput/total_tokens=180,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=942/500000]
+ train/ActionL1Loss=0.1133
+ throughput/total_tokens=180,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=943/500000]
+ train/ActionL1Loss=0.1258
+ throughput/total_tokens=181,056,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=944/500000]
+ train/ActionL1Loss=0.1067
+ throughput/total_tokens=181,248,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=945/500000]
+ train/ActionL1Loss=0.1129
+ throughput/total_tokens=181,440,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=946/500000]
+ train/ActionL1Loss=0.0979
+ throughput/total_tokens=181,632,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=947/500000]
+ train/ActionL1Loss=0.1326
+ throughput/total_tokens=181,824,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=948/500000]
+ train/ActionL1Loss=0.1162
+ throughput/total_tokens=182,016,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=949/500000]
+ train/ActionL1Loss=0.1125
+ throughput/total_tokens=182,208,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=950/500000]
+ train/ActionL1Loss=0.1127
+ throughput/total_tokens=182,400,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=951/500000]
+ train/ActionL1Loss=0.1152
+ throughput/total_tokens=182,592,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=952/500000]
+ train/ActionL1Loss=0.0925
+ throughput/total_tokens=182,784,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=953/500000]
+ train/ActionL1Loss=0.1043
+ throughput/total_tokens=182,976,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=954/500000]
+ train/ActionL1Loss=0.1126
+ throughput/total_tokens=183,168,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=955/500000]
+ train/ActionL1Loss=0.0950
+ throughput/total_tokens=183,360,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=956/500000]
+ train/ActionL1Loss=0.0853
+ throughput/total_tokens=183,552,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=957/500000]
+ train/ActionL1Loss=0.1266
+ throughput/total_tokens=183,744,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=958/500000]
+ train/ActionL1Loss=0.1275
+ throughput/total_tokens=183,936,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=959/500000]
+ train/ActionL1Loss=0.1240
+ throughput/total_tokens=184,128,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=960/500000]
+ optim/total_grad_norm=11.71
+ train/ActionL1Loss=0.1207
+ throughput/total_tokens=184,320,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=46,917
+[step=961/500000]
+ train/ActionL1Loss=0.1153
+ throughput/total_tokens=184,512,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=962/500000]
+ train/ActionL1Loss=0.1153
+ throughput/total_tokens=184,704,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=963/500000]
+ train/ActionL1Loss=0.1175
+ throughput/total_tokens=184,896,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=964/500000]
+ train/ActionL1Loss=0.1110
+ throughput/total_tokens=185,088,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+[step=965/500000]
+ train/ActionL1Loss=0.1066
+ throughput/total_tokens=185,280,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=966/500000]
+ train/ActionL1Loss=0.1103
+ throughput/total_tokens=185,472,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=967/500000]
+ train/ActionL1Loss=0.1274
+ throughput/total_tokens=185,664,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=968/500000]
+ train/ActionL1Loss=0.1177
+ throughput/total_tokens=185,856,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=969/500000]
+ train/ActionL1Loss=0.1133
+ throughput/total_tokens=186,048,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=970/500000]
+ train/ActionL1Loss=0.1266
+ throughput/total_tokens=186,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=971/500000]
+ train/ActionL1Loss=0.1257
+ throughput/total_tokens=186,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=972/500000]
+ train/ActionL1Loss=0.1315
+ throughput/total_tokens=186,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=973/500000]
+ train/ActionL1Loss=0.1129
+ throughput/total_tokens=186,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=974/500000]
+ train/ActionL1Loss=0.1101
+ throughput/total_tokens=187,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=975/500000]
+ train/ActionL1Loss=0.1237
+ throughput/total_tokens=187,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=976/500000]
+ train/ActionL1Loss=0.1196
+ throughput/total_tokens=187,392,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=977/500000]
+ train/ActionL1Loss=0.1346
+ throughput/total_tokens=187,584,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=978/500000]
+ train/ActionL1Loss=0.1207
+ throughput/total_tokens=187,776,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=979/500000]
+ train/ActionL1Loss=0.1127
+ throughput/total_tokens=187,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=980/500000]
+ optim/total_grad_norm=9.464
+ train/ActionL1Loss=0.1158
+ throughput/total_tokens=188,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=981/500000]
+ train/ActionL1Loss=0.1139
+ throughput/total_tokens=188,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=982/500000]
+ train/ActionL1Loss=0.1109
+ throughput/total_tokens=188,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=983/500000]
+ train/ActionL1Loss=0.1082
+ throughput/total_tokens=188,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=984/500000]
+ train/ActionL1Loss=0.1215
+ throughput/total_tokens=188,928,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=985/500000]
+ train/ActionL1Loss=0.1109
+ throughput/total_tokens=189,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=986/500000]
+ train/ActionL1Loss=0.1229
+ throughput/total_tokens=189,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=987/500000]
+ train/ActionL1Loss=0.1145
+ throughput/total_tokens=189,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=988/500000]
+ train/ActionL1Loss=0.1049
+ throughput/total_tokens=189,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=989/500000]
+ train/ActionL1Loss=0.0950
+ throughput/total_tokens=189,888,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=990/500000]
+ train/ActionL1Loss=0.1014
+ throughput/total_tokens=190,080,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=991/500000]
+ train/ActionL1Loss=0.1039
+ throughput/total_tokens=190,272,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=992/500000]
+ train/ActionL1Loss=0.1151
+ throughput/total_tokens=190,464,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=993/500000]
+ train/ActionL1Loss=0.1113
+ throughput/total_tokens=190,656,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=994/500000]
+ train/ActionL1Loss=0.0836
+ throughput/total_tokens=190,848,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=995/500000]
+ train/ActionL1Loss=0.0874
+ throughput/total_tokens=191,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=996/500000]
+ train/ActionL1Loss=0.0955
+ throughput/total_tokens=191,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=997/500000]
+ train/ActionL1Loss=0.1118
+ throughput/total_tokens=191,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=998/500000]
+ train/ActionL1Loss=0.0876
+ throughput/total_tokens=191,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=999/500000]
+ train/ActionL1Loss=0.1093
+ throughput/total_tokens=191,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1000/500000]
+ optim/total_grad_norm=14.04
+ train/ActionL1Loss=0.1204
+ throughput/total_tokens=192,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+10/02 [22:22:34] INFO | >> Saving config... checkpoint.py:608
+10/02 [22:23:26] INFO | >> Saving model state... checkpoint.py:796
+10/02 [22:24:35] INFO | >> Saving optim state... checkpoint.py:811
+10/02 [22:26:05] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=1001/500000]
+ train/ActionL1Loss=0.1009
+ throughput/total_tokens=192,192,000
+ throughput/device/tokens_per_second=1,209
+ throughput/device/batches_per_second=0.0504
+[step=1002/500000]
+ train/ActionL1Loss=0.0892
+ throughput/total_tokens=192,384,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1003/500000]
+ train/ActionL1Loss=0.0996
+ throughput/total_tokens=192,576,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1004/500000]
+ train/ActionL1Loss=0.1003
+ throughput/total_tokens=192,768,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1005/500000]
+ train/ActionL1Loss=0.1186
+ throughput/total_tokens=192,960,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1006/500000]
+ train/ActionL1Loss=0.1340
+ throughput/total_tokens=193,152,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1007/500000]
+ train/ActionL1Loss=0.1136
+ throughput/total_tokens=193,344,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1008/500000]
+ train/ActionL1Loss=0.0878
+ throughput/total_tokens=193,536,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1009/500000]
+ train/ActionL1Loss=0.1025
+ throughput/total_tokens=193,728,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1010/500000]
+ train/ActionL1Loss=0.0948
+ throughput/total_tokens=193,920,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=1011/500000]
+ train/ActionL1Loss=0.0864
+ throughput/total_tokens=194,112,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1012/500000]
+ train/ActionL1Loss=0.1225
+ throughput/total_tokens=194,304,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1013/500000]
+ train/ActionL1Loss=0.1050
+ throughput/total_tokens=194,496,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1014/500000]
+ train/ActionL1Loss=0.1114
+ throughput/total_tokens=194,688,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1015/500000]
+ train/ActionL1Loss=0.1079
+ throughput/total_tokens=194,880,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1016/500000]
+ train/ActionL1Loss=0.0970
+ throughput/total_tokens=195,072,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1017/500000]
+ train/ActionL1Loss=0.1136
+ throughput/total_tokens=195,264,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1018/500000]
+ train/ActionL1Loss=0.1250
+ throughput/total_tokens=195,456,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1019/500000]
+ train/ActionL1Loss=0.0926
+ throughput/total_tokens=195,648,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1020/500000]
+ optim/total_grad_norm=12.95
+ train/ActionL1Loss=0.1052
+ throughput/total_tokens=195,840,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1021/500000]
+ train/ActionL1Loss=0.1033
+ throughput/total_tokens=196,032,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1022/500000]
+ train/ActionL1Loss=0.1044
+ throughput/total_tokens=196,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1023/500000]
+ train/ActionL1Loss=0.0912
+ throughput/total_tokens=196,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1024/500000]
+ train/ActionL1Loss=0.1056
+ throughput/total_tokens=196,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1025/500000]
+ train/ActionL1Loss=0.0974
+ throughput/total_tokens=196,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1026/500000]
+ train/ActionL1Loss=0.1003
+ throughput/total_tokens=196,992,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1027/500000]
+ train/ActionL1Loss=0.0981
+ throughput/total_tokens=197,184,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1028/500000]
+ train/ActionL1Loss=0.0912
+ throughput/total_tokens=197,376,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1029/500000]
+ train/ActionL1Loss=0.0952
+ throughput/total_tokens=197,568,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1030/500000]
+ train/ActionL1Loss=0.0887
+ throughput/total_tokens=197,760,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1031/500000]
+ train/ActionL1Loss=0.1210
+ throughput/total_tokens=197,952,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1032/500000]
+ train/ActionL1Loss=0.1048
+ throughput/total_tokens=198,144,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1033/500000]
+ train/ActionL1Loss=0.1058
+ throughput/total_tokens=198,336,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1034/500000]
+ train/ActionL1Loss=0.1074
+ throughput/total_tokens=198,528,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1035/500000]
+ train/ActionL1Loss=0.0962
+ throughput/total_tokens=198,720,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1036/500000]
+ train/ActionL1Loss=0.0937
+ throughput/total_tokens=198,912,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1037/500000]
+ train/ActionL1Loss=0.0986
+ throughput/total_tokens=199,104,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1038/500000]
+ train/ActionL1Loss=0.0839
+ throughput/total_tokens=199,296,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1039/500000]
+ train/ActionL1Loss=0.1171
+ throughput/total_tokens=199,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1040/500000]
+ optim/total_grad_norm=10.64
+ train/ActionL1Loss=0.1244
+ throughput/total_tokens=199,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1041/500000]
+ train/ActionL1Loss=0.1205
+ throughput/total_tokens=199,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1042/500000]
+ train/ActionL1Loss=0.1048
+ throughput/total_tokens=200,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1043/500000]
+ train/ActionL1Loss=0.1173
+ throughput/total_tokens=200,256,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1044/500000]
+ train/ActionL1Loss=0.1050
+ throughput/total_tokens=200,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1045/500000]
+ train/ActionL1Loss=0.0962
+ throughput/total_tokens=200,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1046/500000]
+ train/ActionL1Loss=0.1132
+ throughput/total_tokens=200,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1047/500000]
+ train/ActionL1Loss=0.1162
+ throughput/total_tokens=201,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1048/500000]
+ train/ActionL1Loss=0.1008
+ throughput/total_tokens=201,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1049/500000]
+ train/ActionL1Loss=0.1217
+ throughput/total_tokens=201,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1050/500000]
+ train/ActionL1Loss=0.1391
+ throughput/total_tokens=201,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1051/500000]
+ train/ActionL1Loss=0.1270
+ throughput/total_tokens=201,792,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1052/500000]
+ train/ActionL1Loss=0.1197
+ throughput/total_tokens=201,984,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1053/500000]
+ train/ActionL1Loss=0.1115
+ throughput/total_tokens=202,176,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1054/500000]
+ train/ActionL1Loss=0.1190
+ throughput/total_tokens=202,368,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1055/500000]
+ train/ActionL1Loss=0.1293
+ throughput/total_tokens=202,560,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1056/500000]
+ train/ActionL1Loss=0.1280
+ throughput/total_tokens=202,752,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1057/500000]
+ train/ActionL1Loss=0.1265
+ throughput/total_tokens=202,944,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1058/500000]
+ train/ActionL1Loss=0.1079
+ throughput/total_tokens=203,136,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1059/500000]
+ train/ActionL1Loss=0.1023
+ throughput/total_tokens=203,328,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1060/500000]
+ optim/total_grad_norm=8.119
+ train/ActionL1Loss=0.1098
+ throughput/total_tokens=203,520,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1061/500000]
+ train/ActionL1Loss=0.1150
+ throughput/total_tokens=203,712,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1062/500000]
+ train/ActionL1Loss=0.1089
+ throughput/total_tokens=203,904,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1063/500000]
+ train/ActionL1Loss=0.0939
+ throughput/total_tokens=204,096,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1064/500000]
+ train/ActionL1Loss=0.1124
+ throughput/total_tokens=204,288,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1065/500000]
+ train/ActionL1Loss=0.1101
+ throughput/total_tokens=204,480,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1066/500000]
+ train/ActionL1Loss=0.0943
+ throughput/total_tokens=204,672,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1067/500000]
+ train/ActionL1Loss=0.0957
+ throughput/total_tokens=204,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1068/500000]
+ train/ActionL1Loss=0.0943
+ throughput/total_tokens=205,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1069/500000]
+ train/ActionL1Loss=0.1140
+ throughput/total_tokens=205,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1070/500000]
+ train/ActionL1Loss=0.1202
+ throughput/total_tokens=205,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1071/500000]
+ train/ActionL1Loss=0.0942
+ throughput/total_tokens=205,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1072/500000]
+ train/ActionL1Loss=0.0722
+ throughput/total_tokens=205,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1073/500000]
+ train/ActionL1Loss=0.0906
+ throughput/total_tokens=206,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1074/500000]
+ train/ActionL1Loss=0.0958
+ throughput/total_tokens=206,208,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1075/500000]
+ train/ActionL1Loss=0.1003
+ throughput/total_tokens=206,400,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1076/500000]
+ train/ActionL1Loss=0.0956
+ throughput/total_tokens=206,592,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1077/500000]
+ train/ActionL1Loss=0.0953
+ throughput/total_tokens=206,784,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1078/500000]
+ train/ActionL1Loss=0.1074
+ throughput/total_tokens=206,976,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1079/500000]
+ train/ActionL1Loss=0.1273
+ throughput/total_tokens=207,168,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1080/500000]
+ optim/total_grad_norm=9.768
+ train/ActionL1Loss=0.1041
+ throughput/total_tokens=207,360,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1081/500000]
+ train/ActionL1Loss=0.1111
+ throughput/total_tokens=207,552,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1082/500000]
+ train/ActionL1Loss=0.1036
+ throughput/total_tokens=207,744,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1083/500000]
+ train/ActionL1Loss=0.0896
+ throughput/total_tokens=207,936,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1084/500000]
+ train/ActionL1Loss=0.0655
+ throughput/total_tokens=208,128,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1085/500000]
+ train/ActionL1Loss=0.0985
+ throughput/total_tokens=208,320,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1086/500000]
+ train/ActionL1Loss=0.1019
+ throughput/total_tokens=208,512,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1087/500000]
+ train/ActionL1Loss=0.0921
+ throughput/total_tokens=208,704,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1088/500000]
+ train/ActionL1Loss=0.0800
+ throughput/total_tokens=208,896,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1089/500000]
+ train/ActionL1Loss=0.0924
+ throughput/total_tokens=209,088,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1090/500000]
+ train/ActionL1Loss=0.0759
+ throughput/total_tokens=209,280,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1091/500000]
+ train/ActionL1Loss=0.0843
+ throughput/total_tokens=209,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1092/500000]
+ train/ActionL1Loss=0.1128
+ throughput/total_tokens=209,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1093/500000]
+ train/ActionL1Loss=0.0950
+ throughput/total_tokens=209,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1094/500000]
+ train/ActionL1Loss=0.1108
+ throughput/total_tokens=210,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1095/500000]
+ train/ActionL1Loss=0.1040
+ throughput/total_tokens=210,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1096/500000]
+ train/ActionL1Loss=0.1042
+ throughput/total_tokens=210,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1097/500000]
+ train/ActionL1Loss=0.1197
+ throughput/total_tokens=210,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1098/500000]
+ train/ActionL1Loss=0.0929
+ throughput/total_tokens=210,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1099/500000]
+ train/ActionL1Loss=0.0937
+ throughput/total_tokens=211,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1100/500000]
+ optim/total_grad_norm=10.03
+ train/ActionL1Loss=0.0880
+ throughput/total_tokens=211,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1101/500000]
+ train/ActionL1Loss=0.1207
+ throughput/total_tokens=211,392,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1102/500000]
+ train/ActionL1Loss=0.1034
+ throughput/total_tokens=211,584,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1103/500000]
+ train/ActionL1Loss=0.0961
+ throughput/total_tokens=211,776,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1104/500000]
+ train/ActionL1Loss=0.1093
+ throughput/total_tokens=211,968,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1105/500000]
+ train/ActionL1Loss=0.1039
+ throughput/total_tokens=212,160,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1106/500000]
+ train/ActionL1Loss=0.1395
+ throughput/total_tokens=212,352,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1107/500000]
+ train/ActionL1Loss=0.1318
+ throughput/total_tokens=212,544,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1108/500000]
+ train/ActionL1Loss=0.0996
+ throughput/total_tokens=212,736,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1109/500000]
+ train/ActionL1Loss=0.1038
+ throughput/total_tokens=212,928,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1110/500000]
+ train/ActionL1Loss=0.1105
+ throughput/total_tokens=213,120,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1111/500000]
+ train/ActionL1Loss=0.1094
+ throughput/total_tokens=213,312,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1112/500000]
+ train/ActionL1Loss=0.0982
+ throughput/total_tokens=213,504,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1113/500000]
+ train/ActionL1Loss=0.1138
+ throughput/total_tokens=213,696,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1114/500000]
+ train/ActionL1Loss=0.1013
+ throughput/total_tokens=213,888,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1115/500000]
+ train/ActionL1Loss=0.1131
+ throughput/total_tokens=214,080,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1116/500000]
+ train/ActionL1Loss=0.1138
+ throughput/total_tokens=214,272,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1117/500000]
+ train/ActionL1Loss=0.1118
+ throughput/total_tokens=214,464,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1118/500000]
+ train/ActionL1Loss=0.1075
+ throughput/total_tokens=214,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1119/500000]
+ train/ActionL1Loss=0.1234
+ throughput/total_tokens=214,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1120/500000]
+ optim/total_grad_norm=11.69
+ train/ActionL1Loss=0.1076
+ throughput/total_tokens=215,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1121/500000]
+ train/ActionL1Loss=0.1139
+ throughput/total_tokens=215,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1122/500000]
+ train/ActionL1Loss=0.1225
+ throughput/total_tokens=215,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1123/500000]
+ train/ActionL1Loss=0.1211
+ throughput/total_tokens=215,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1124/500000]
+ train/ActionL1Loss=0.1179
+ throughput/total_tokens=215,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1125/500000]
+ train/ActionL1Loss=0.1381
+ throughput/total_tokens=216,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1126/500000]
+ train/ActionL1Loss=0.1235
+ throughput/total_tokens=216,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1127/500000]
+ train/ActionL1Loss=0.2518
+ throughput/total_tokens=216,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1128/500000]
+ train/ActionL1Loss=0.5933
+ throughput/total_tokens=216,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1129/500000]
+ train/ActionL1Loss=0.1505
+ throughput/total_tokens=216,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1130/500000]
+ train/ActionL1Loss=0.1206
+ throughput/total_tokens=216,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1131/500000]
+ train/ActionL1Loss=0.1292
+ throughput/total_tokens=217,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1132/500000]
+ train/ActionL1Loss=0.1603
+ throughput/total_tokens=217,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1133/500000]
+ train/ActionL1Loss=0.1245
+ throughput/total_tokens=217,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1134/500000]
+ train/ActionL1Loss=0.1270
+ throughput/total_tokens=217,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1135/500000]
+ train/ActionL1Loss=0.1221
+ throughput/total_tokens=217,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1136/500000]
+ train/ActionL1Loss=0.1139
+ throughput/total_tokens=218,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1137/500000]
+ train/ActionL1Loss=0.1326
+ throughput/total_tokens=218,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1138/500000]
+ train/ActionL1Loss=0.1118
+ throughput/total_tokens=218,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1139/500000]
+ train/ActionL1Loss=0.1115
+ throughput/total_tokens=218,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1140/500000]
+ optim/total_grad_norm=11.76
+ train/ActionL1Loss=0.1329
+ throughput/total_tokens=218,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1141/500000]
+ train/ActionL1Loss=0.1509
+ throughput/total_tokens=219,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1142/500000]
+ train/ActionL1Loss=0.1145
+ throughput/total_tokens=219,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1143/500000]
+ train/ActionL1Loss=0.1143
+ throughput/total_tokens=219,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1144/500000]
+ train/ActionL1Loss=0.1175
+ throughput/total_tokens=219,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1145/500000]
+ train/ActionL1Loss=0.0931
+ throughput/total_tokens=219,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1146/500000]
+ train/ActionL1Loss=0.1013
+ throughput/total_tokens=220,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1147/500000]
+ train/ActionL1Loss=0.0945
+ throughput/total_tokens=220,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1148/500000]
+ train/ActionL1Loss=0.1179
+ throughput/total_tokens=220,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1149/500000]
+ train/ActionL1Loss=0.1097
+ throughput/total_tokens=220,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1150/500000]
+ train/ActionL1Loss=0.1302
+ throughput/total_tokens=220,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1151/500000]
+ train/ActionL1Loss=0.1011
+ throughput/total_tokens=220,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1152/500000]
+ train/ActionL1Loss=0.1340
+ throughput/total_tokens=221,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1153/500000]
+ train/ActionL1Loss=0.1219
+ throughput/total_tokens=221,376,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1154/500000]
+ train/ActionL1Loss=0.1269
+ throughput/total_tokens=221,568,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1155/500000]
+ train/ActionL1Loss=0.1180
+ throughput/total_tokens=221,760,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1156/500000]
+ train/ActionL1Loss=0.1089
+ throughput/total_tokens=221,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1157/500000]
+ train/ActionL1Loss=0.1010
+ throughput/total_tokens=222,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1158/500000]
+ train/ActionL1Loss=0.1252
+ throughput/total_tokens=222,336,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1159/500000]
+ train/ActionL1Loss=0.1389
+ throughput/total_tokens=222,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1160/500000]
+ optim/total_grad_norm=12.66
+ train/ActionL1Loss=0.1283
+ throughput/total_tokens=222,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=1161/500000]
+ train/ActionL1Loss=0.1442
+ throughput/total_tokens=222,912,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1162/500000]
+ train/ActionL1Loss=0.1136
+ throughput/total_tokens=223,104,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1163/500000]
+ train/ActionL1Loss=0.1391
+ throughput/total_tokens=223,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1164/500000]
+ train/ActionL1Loss=0.1326
+ throughput/total_tokens=223,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1165/500000]
+ train/ActionL1Loss=0.1230
+ throughput/total_tokens=223,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1166/500000]
+ train/ActionL1Loss=0.1389
+ throughput/total_tokens=223,872,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1167/500000]
+ train/ActionL1Loss=0.1070
+ throughput/total_tokens=224,064,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1168/500000]
+ train/ActionL1Loss=0.1042
+ throughput/total_tokens=224,256,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1169/500000]
+ train/ActionL1Loss=0.1205
+ throughput/total_tokens=224,448,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1170/500000]
+ train/ActionL1Loss=0.1155
+ throughput/total_tokens=224,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1171/500000]
+ train/ActionL1Loss=0.1223
+ throughput/total_tokens=224,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1172/500000]
+ train/ActionL1Loss=0.0917
+ throughput/total_tokens=225,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1173/500000]
+ train/ActionL1Loss=0.1116
+ throughput/total_tokens=225,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1174/500000]
+ train/ActionL1Loss=0.0888
+ throughput/total_tokens=225,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1175/500000]
+ train/ActionL1Loss=0.1006
+ throughput/total_tokens=225,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1176/500000]
+ train/ActionL1Loss=0.1062
+ throughput/total_tokens=225,792,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1177/500000]
+ train/ActionL1Loss=0.1158
+ throughput/total_tokens=225,984,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1178/500000]
+ train/ActionL1Loss=0.1149
+ throughput/total_tokens=226,176,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1179/500000]
+ train/ActionL1Loss=0.1193
+ throughput/total_tokens=226,368,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1180/500000]
+ optim/total_grad_norm=9.876
+ train/ActionL1Loss=0.0896
+ throughput/total_tokens=226,560,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1181/500000]
+ train/ActionL1Loss=0.1106
+ throughput/total_tokens=226,752,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1182/500000]
+ train/ActionL1Loss=0.1164
+ throughput/total_tokens=226,944,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1183/500000]
+ train/ActionL1Loss=0.0926
+ throughput/total_tokens=227,136,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1184/500000]
+ train/ActionL1Loss=0.1106
+ throughput/total_tokens=227,328,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1185/500000]
+ train/ActionL1Loss=0.0933
+ throughput/total_tokens=227,520,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1186/500000]
+ train/ActionL1Loss=0.1088
+ throughput/total_tokens=227,712,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1187/500000]
+ train/ActionL1Loss=0.1194
+ throughput/total_tokens=227,904,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1188/500000]
+ train/ActionL1Loss=0.0973
+ throughput/total_tokens=228,096,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1189/500000]
+ train/ActionL1Loss=0.1080
+ throughput/total_tokens=228,288,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1190/500000]
+ train/ActionL1Loss=0.1151
+ throughput/total_tokens=228,480,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1191/500000]
+ train/ActionL1Loss=0.1142
+ throughput/total_tokens=228,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1192/500000]
+ train/ActionL1Loss=0.1262
+ throughput/total_tokens=228,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1193/500000]
+ train/ActionL1Loss=0.1134
+ throughput/total_tokens=229,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1194/500000]
+ train/ActionL1Loss=0.0885
+ throughput/total_tokens=229,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1195/500000]
+ train/ActionL1Loss=0.0927
+ throughput/total_tokens=229,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1196/500000]
+ train/ActionL1Loss=0.1038
+ throughput/total_tokens=229,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1197/500000]
+ train/ActionL1Loss=0.1116
+ throughput/total_tokens=229,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1198/500000]
+ train/ActionL1Loss=0.1152
+ throughput/total_tokens=230,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1199/500000]
+ train/ActionL1Loss=0.0992
+ throughput/total_tokens=230,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1200/500000]
+ optim/total_grad_norm=11.83
+ train/ActionL1Loss=0.0885
+ throughput/total_tokens=230,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1201/500000]
+ train/ActionL1Loss=0.1015
+ throughput/total_tokens=230,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1202/500000]
+ train/ActionL1Loss=0.1191
+ throughput/total_tokens=230,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1203/500000]
+ train/ActionL1Loss=0.0934
+ throughput/total_tokens=230,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1204/500000]
+ train/ActionL1Loss=0.1084
+ throughput/total_tokens=231,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1205/500000]
+ train/ActionL1Loss=0.1224
+ throughput/total_tokens=231,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1206/500000]
+ train/ActionL1Loss=0.0976
+ throughput/total_tokens=231,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1207/500000]
+ train/ActionL1Loss=0.1032
+ throughput/total_tokens=231,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1208/500000]
+ train/ActionL1Loss=0.1156
+ throughput/total_tokens=231,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1209/500000]
+ train/ActionL1Loss=0.0990
+ throughput/total_tokens=232,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1210/500000]
+ train/ActionL1Loss=0.0856
+ throughput/total_tokens=232,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=1211/500000]
+ train/ActionL1Loss=0.0925
+ throughput/total_tokens=232,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1212/500000]
+ train/ActionL1Loss=0.0951
+ throughput/total_tokens=232,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1213/500000]
+ train/ActionL1Loss=0.1302
+ throughput/total_tokens=232,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1214/500000]
+ train/ActionL1Loss=0.0986
+ throughput/total_tokens=233,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1215/500000]
+ train/ActionL1Loss=0.1152
+ throughput/total_tokens=233,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1216/500000]
+ train/ActionL1Loss=0.1098
+ throughput/total_tokens=233,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1217/500000]
+ train/ActionL1Loss=0.1175
+ throughput/total_tokens=233,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1218/500000]
+ train/ActionL1Loss=0.1025
+ throughput/total_tokens=233,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1219/500000]
+ train/ActionL1Loss=0.0983
+ throughput/total_tokens=234,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1220/500000]
+ optim/total_grad_norm=10.40
+ train/ActionL1Loss=0.0943
+ throughput/total_tokens=234,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1221/500000]
+ train/ActionL1Loss=0.0882
+ throughput/total_tokens=234,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1222/500000]
+ train/ActionL1Loss=0.1039
+ throughput/total_tokens=234,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1223/500000]
+ train/ActionL1Loss=0.1055
+ throughput/total_tokens=234,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1224/500000]
+ train/ActionL1Loss=0.0994
+ throughput/total_tokens=235,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1225/500000]
+ train/ActionL1Loss=0.1218
+ throughput/total_tokens=235,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1226/500000]
+ train/ActionL1Loss=0.1360
+ throughput/total_tokens=235,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1227/500000]
+ train/ActionL1Loss=0.0998
+ throughput/total_tokens=235,584,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1228/500000]
+ train/ActionL1Loss=0.0993
+ throughput/total_tokens=235,776,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1229/500000]
+ train/ActionL1Loss=0.1266
+ throughput/total_tokens=235,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1230/500000]
+ train/ActionL1Loss=0.1416
+ throughput/total_tokens=236,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1231/500000]
+ train/ActionL1Loss=0.1120
+ throughput/total_tokens=236,352,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1232/500000]
+ train/ActionL1Loss=0.1000
+ throughput/total_tokens=236,544,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1233/500000]
+ train/ActionL1Loss=0.1232
+ throughput/total_tokens=236,736,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1234/500000]
+ train/ActionL1Loss=0.1109
+ throughput/total_tokens=236,928,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1235/500000]
+ train/ActionL1Loss=0.1297
+ throughput/total_tokens=237,120,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1236/500000]
+ train/ActionL1Loss=0.1062
+ throughput/total_tokens=237,312,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1237/500000]
+ train/ActionL1Loss=0.0721
+ throughput/total_tokens=237,504,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1238/500000]
+ train/ActionL1Loss=0.0891
+ throughput/total_tokens=237,696,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1239/500000]
+ train/ActionL1Loss=0.1108
+ throughput/total_tokens=237,888,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1240/500000]
+ optim/total_grad_norm=9.974
+ train/ActionL1Loss=0.1151
+ throughput/total_tokens=238,080,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1241/500000]
+ train/ActionL1Loss=0.1023
+ throughput/total_tokens=238,272,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1242/500000]
+ train/ActionL1Loss=0.1099
+ throughput/total_tokens=238,464,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1243/500000]
+ train/ActionL1Loss=0.1228
+ throughput/total_tokens=238,656,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1244/500000]
+ train/ActionL1Loss=0.1115
+ throughput/total_tokens=238,848,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1245/500000]
+ train/ActionL1Loss=0.1071
+ throughput/total_tokens=239,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1246/500000]
+ train/ActionL1Loss=0.0928
+ throughput/total_tokens=239,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1247/500000]
+ train/ActionL1Loss=0.1227
+ throughput/total_tokens=239,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1248/500000]
+ train/ActionL1Loss=0.0972
+ throughput/total_tokens=239,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1249/500000]
+ train/ActionL1Loss=0.0923
+ throughput/total_tokens=239,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1250/500000]
+ train/ActionL1Loss=0.1063
+ throughput/total_tokens=240,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1251/500000]
+ train/ActionL1Loss=0.1081
+ throughput/total_tokens=240,192,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1252/500000]
+ train/ActionL1Loss=0.0995
+ throughput/total_tokens=240,384,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1253/500000]
+ train/ActionL1Loss=0.1025
+ throughput/total_tokens=240,576,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1254/500000]
+ train/ActionL1Loss=0.0960
+ throughput/total_tokens=240,768,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1255/500000]
+ train/ActionL1Loss=0.1144
+ throughput/total_tokens=240,960,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1256/500000]
+ train/ActionL1Loss=0.0915
+ throughput/total_tokens=241,152,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1257/500000]
+ train/ActionL1Loss=0.0897
+ throughput/total_tokens=241,344,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1258/500000]
+ train/ActionL1Loss=0.0915
+ throughput/total_tokens=241,536,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1259/500000]
+ train/ActionL1Loss=0.0970
+ throughput/total_tokens=241,728,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1260/500000]
+ optim/total_grad_norm=11.88
+ train/ActionL1Loss=0.1047
+ throughput/total_tokens=241,920,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1261/500000]
+ train/ActionL1Loss=0.1006
+ throughput/total_tokens=242,112,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1262/500000]
+ train/ActionL1Loss=0.1063
+ throughput/total_tokens=242,304,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1263/500000]
+ train/ActionL1Loss=0.0890
+ throughput/total_tokens=242,496,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1264/500000]
+ train/ActionL1Loss=0.1180
+ throughput/total_tokens=242,688,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1265/500000]
+ train/ActionL1Loss=0.0994
+ throughput/total_tokens=242,880,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1266/500000]
+ train/ActionL1Loss=0.0853
+ throughput/total_tokens=243,072,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1267/500000]
+ train/ActionL1Loss=0.0829
+ throughput/total_tokens=243,264,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1268/500000]
+ train/ActionL1Loss=0.1032
+ throughput/total_tokens=243,456,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1269/500000]
+ train/ActionL1Loss=0.0987
+ throughput/total_tokens=243,648,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1270/500000]
+ train/ActionL1Loss=0.1036
+ throughput/total_tokens=243,840,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1271/500000]
+ train/ActionL1Loss=0.0934
+ throughput/total_tokens=244,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1272/500000]
+ train/ActionL1Loss=0.1063
+ throughput/total_tokens=244,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1273/500000]
+ train/ActionL1Loss=0.1018
+ throughput/total_tokens=244,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1274/500000]
+ train/ActionL1Loss=0.0991
+ throughput/total_tokens=244,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1275/500000]
+ train/ActionL1Loss=0.0877
+ throughput/total_tokens=244,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1276/500000]
+ train/ActionL1Loss=0.0850
+ throughput/total_tokens=244,992,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1277/500000]
+ train/ActionL1Loss=0.1026
+ throughput/total_tokens=245,184,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1278/500000]
+ train/ActionL1Loss=0.1024
+ throughput/total_tokens=245,376,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1279/500000]
+ train/ActionL1Loss=0.0876
+ throughput/total_tokens=245,568,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1280/500000]
+ optim/total_grad_norm=7.288
+ train/ActionL1Loss=0.1021
+ throughput/total_tokens=245,760,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1281/500000]
+ train/ActionL1Loss=0.0855
+ throughput/total_tokens=245,952,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1282/500000]
+ train/ActionL1Loss=0.0905
+ throughput/total_tokens=246,144,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1283/500000]
+ train/ActionL1Loss=0.1075
+ throughput/total_tokens=246,336,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1284/500000]
+ train/ActionL1Loss=0.1010
+ throughput/total_tokens=246,528,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1285/500000]
+ train/ActionL1Loss=0.1305
+ throughput/total_tokens=246,720,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1286/500000]
+ train/ActionL1Loss=0.0858
+ throughput/total_tokens=246,912,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1287/500000]
+ train/ActionL1Loss=0.1182
+ throughput/total_tokens=247,104,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1288/500000]
+ train/ActionL1Loss=0.1332
+ throughput/total_tokens=247,296,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1289/500000]
+ train/ActionL1Loss=0.1314
+ throughput/total_tokens=247,488,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1290/500000]
+ train/ActionL1Loss=0.0966
+ throughput/total_tokens=247,680,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1291/500000]
+ train/ActionL1Loss=0.0847
+ throughput/total_tokens=247,872,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1292/500000]
+ train/ActionL1Loss=0.0978
+ throughput/total_tokens=248,064,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1293/500000]
+ train/ActionL1Loss=0.0934
+ throughput/total_tokens=248,256,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1294/500000]
+ train/ActionL1Loss=0.0838
+ throughput/total_tokens=248,448,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1295/500000]
+ train/ActionL1Loss=0.0876
+ throughput/total_tokens=248,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1296/500000]
+ train/ActionL1Loss=0.1137
+ throughput/total_tokens=248,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1297/500000]
+ train/ActionL1Loss=0.0838
+ throughput/total_tokens=249,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1298/500000]
+ train/ActionL1Loss=0.0698
+ throughput/total_tokens=249,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1299/500000]
+ train/ActionL1Loss=0.1044
+ throughput/total_tokens=249,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1300/500000]
+ optim/total_grad_norm=11.08
+ train/ActionL1Loss=0.0969
+ throughput/total_tokens=249,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1301/500000]
+ train/ActionL1Loss=0.0943
+ throughput/total_tokens=249,792,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1302/500000]
+ train/ActionL1Loss=0.1323
+ throughput/total_tokens=249,984,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1303/500000]
+ train/ActionL1Loss=0.1152
+ throughput/total_tokens=250,176,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1304/500000]
+ train/ActionL1Loss=0.1084
+ throughput/total_tokens=250,368,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1305/500000]
+ train/ActionL1Loss=0.0875
+ throughput/total_tokens=250,560,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1306/500000]
+ train/ActionL1Loss=0.0884
+ throughput/total_tokens=250,752,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1307/500000]
+ train/ActionL1Loss=0.0925
+ throughput/total_tokens=250,944,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1308/500000]
+ train/ActionL1Loss=0.1181
+ throughput/total_tokens=251,136,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1309/500000]
+ train/ActionL1Loss=0.1293
+ throughput/total_tokens=251,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1310/500000]
+ train/ActionL1Loss=0.1083
+ throughput/total_tokens=251,520,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=1311/500000]
+ train/ActionL1Loss=0.1226
+ throughput/total_tokens=251,712,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1312/500000]
+ train/ActionL1Loss=0.0892
+ throughput/total_tokens=251,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1313/500000]
+ train/ActionL1Loss=0.1089
+ throughput/total_tokens=252,096,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1314/500000]
+ train/ActionL1Loss=0.1155
+ throughput/total_tokens=252,288,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1315/500000]
+ train/ActionL1Loss=0.0842
+ throughput/total_tokens=252,480,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1316/500000]
+ train/ActionL1Loss=0.0963
+ throughput/total_tokens=252,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1317/500000]
+ train/ActionL1Loss=0.0980
+ throughput/total_tokens=252,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1318/500000]
+ train/ActionL1Loss=0.1073
+ throughput/total_tokens=253,056,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1319/500000]
+ train/ActionL1Loss=0.1089
+ throughput/total_tokens=253,248,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1320/500000]
+ optim/total_grad_norm=9.553
+ train/ActionL1Loss=0.1042
+ throughput/total_tokens=253,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1321/500000]
+ train/ActionL1Loss=0.1007
+ throughput/total_tokens=253,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1322/500000]
+ train/ActionL1Loss=0.1139
+ throughput/total_tokens=253,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1323/500000]
+ train/ActionL1Loss=0.0954
+ throughput/total_tokens=254,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1324/500000]
+ train/ActionL1Loss=0.0974
+ throughput/total_tokens=254,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1325/500000]
+ train/ActionL1Loss=0.1059
+ throughput/total_tokens=254,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1326/500000]
+ train/ActionL1Loss=0.0936
+ throughput/total_tokens=254,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1327/500000]
+ train/ActionL1Loss=0.1393
+ throughput/total_tokens=254,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1328/500000]
+ train/ActionL1Loss=0.0923
+ throughput/total_tokens=254,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1329/500000]
+ train/ActionL1Loss=0.1234
+ throughput/total_tokens=255,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1330/500000]
+ train/ActionL1Loss=0.0979
+ throughput/total_tokens=255,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1331/500000]
+ train/ActionL1Loss=0.1231
+ throughput/total_tokens=255,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1332/500000]
+ train/ActionL1Loss=0.0974
+ throughput/total_tokens=255,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1333/500000]
+ train/ActionL1Loss=0.0787
+ throughput/total_tokens=255,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1334/500000]
+ train/ActionL1Loss=0.1059
+ throughput/total_tokens=256,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1335/500000]
+ train/ActionL1Loss=0.0871
+ throughput/total_tokens=256,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1336/500000]
+ train/ActionL1Loss=0.1083
+ throughput/total_tokens=256,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1337/500000]
+ train/ActionL1Loss=0.0792
+ throughput/total_tokens=256,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1338/500000]
+ train/ActionL1Loss=0.1024
+ throughput/total_tokens=256,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1339/500000]
+ train/ActionL1Loss=0.0952
+ throughput/total_tokens=257,088,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1340/500000]
+ optim/total_grad_norm=10.28
+ train/ActionL1Loss=0.0780
+ throughput/total_tokens=257,280,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1341/500000]
+ train/ActionL1Loss=0.1066
+ throughput/total_tokens=257,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1342/500000]
+ train/ActionL1Loss=0.0914
+ throughput/total_tokens=257,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1343/500000]
+ train/ActionL1Loss=0.0739
+ throughput/total_tokens=257,856,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1344/500000]
+ train/ActionL1Loss=0.0831
+ throughput/total_tokens=258,048,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1345/500000]
+ train/ActionL1Loss=0.1061
+ throughput/total_tokens=258,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1346/500000]
+ train/ActionL1Loss=0.0977
+ throughput/total_tokens=258,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1347/500000]
+ train/ActionL1Loss=0.1028
+ throughput/total_tokens=258,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1348/500000]
+ train/ActionL1Loss=0.1020
+ throughput/total_tokens=258,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1349/500000]
+ train/ActionL1Loss=0.0992
+ throughput/total_tokens=259,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1350/500000]
+ train/ActionL1Loss=0.0914
+ throughput/total_tokens=259,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1351/500000]
+ train/ActionL1Loss=0.1067
+ throughput/total_tokens=259,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1352/500000]
+ train/ActionL1Loss=0.1133
+ throughput/total_tokens=259,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1353/500000]
+ train/ActionL1Loss=0.1055
+ throughput/total_tokens=259,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1354/500000]
+ train/ActionL1Loss=0.0859
+ throughput/total_tokens=259,968,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1355/500000]
+ train/ActionL1Loss=0.1026
+ throughput/total_tokens=260,160,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1356/500000]
+ train/ActionL1Loss=0.0787
+ throughput/total_tokens=260,352,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1357/500000]
+ train/ActionL1Loss=0.0834
+ throughput/total_tokens=260,544,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1358/500000]
+ train/ActionL1Loss=0.1104
+ throughput/total_tokens=260,736,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1359/500000]
+ train/ActionL1Loss=0.1034
+ throughput/total_tokens=260,928,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1360/500000]
+ optim/total_grad_norm=8.911
+ train/ActionL1Loss=0.1024
+ throughput/total_tokens=261,120,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1361/500000]
+ train/ActionL1Loss=0.1132
+ throughput/total_tokens=261,312,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1362/500000]
+ train/ActionL1Loss=0.1068
+ throughput/total_tokens=261,504,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1363/500000]
+ train/ActionL1Loss=0.1277
+ throughput/total_tokens=261,696,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1364/500000]
+ train/ActionL1Loss=0.1149
+ throughput/total_tokens=261,888,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1365/500000]
+ train/ActionL1Loss=0.0882
+ throughput/total_tokens=262,080,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1366/500000]
+ train/ActionL1Loss=0.1017
+ throughput/total_tokens=262,272,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1367/500000]
+ train/ActionL1Loss=0.0993
+ throughput/total_tokens=262,464,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1368/500000]
+ train/ActionL1Loss=0.0997
+ throughput/total_tokens=262,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1369/500000]
+ train/ActionL1Loss=0.0900
+ throughput/total_tokens=262,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1370/500000]
+ train/ActionL1Loss=0.1199
+ throughput/total_tokens=263,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1371/500000]
+ train/ActionL1Loss=0.1116
+ throughput/total_tokens=263,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1372/500000]
+ train/ActionL1Loss=0.1199
+ throughput/total_tokens=263,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1373/500000]
+ train/ActionL1Loss=0.1111
+ throughput/total_tokens=263,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1374/500000]
+ train/ActionL1Loss=0.1041
+ throughput/total_tokens=263,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1375/500000]
+ train/ActionL1Loss=0.0899
+ throughput/total_tokens=264,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1376/500000]
+ train/ActionL1Loss=0.0974
+ throughput/total_tokens=264,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1377/500000]
+ train/ActionL1Loss=0.0874
+ throughput/total_tokens=264,384,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1378/500000]
+ train/ActionL1Loss=0.0961
+ throughput/total_tokens=264,576,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1379/500000]
+ train/ActionL1Loss=0.0928
+ throughput/total_tokens=264,768,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1380/500000]
+ optim/total_grad_norm=10.39
+ train/ActionL1Loss=0.1087
+ throughput/total_tokens=264,960,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1381/500000]
+ train/ActionL1Loss=0.0990
+ throughput/total_tokens=265,152,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1382/500000]
+ train/ActionL1Loss=0.0934
+ throughput/total_tokens=265,344,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1383/500000]
+ train/ActionL1Loss=0.1091
+ throughput/total_tokens=265,536,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1384/500000]
+ train/ActionL1Loss=0.0965
+ throughput/total_tokens=265,728,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1385/500000]
+ train/ActionL1Loss=0.1223
+ throughput/total_tokens=265,920,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1386/500000]
+ train/ActionL1Loss=0.0951
+ throughput/total_tokens=266,112,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1387/500000]
+ train/ActionL1Loss=0.0731
+ throughput/total_tokens=266,304,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1388/500000]
+ train/ActionL1Loss=0.0857
+ throughput/total_tokens=266,496,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1389/500000]
+ train/ActionL1Loss=0.0895
+ throughput/total_tokens=266,688,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1390/500000]
+ train/ActionL1Loss=0.0843
+ throughput/total_tokens=266,880,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1391/500000]
+ train/ActionL1Loss=0.0995
+ throughput/total_tokens=267,072,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1392/500000]
+ train/ActionL1Loss=0.0883
+ throughput/total_tokens=267,264,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1393/500000]
+ train/ActionL1Loss=0.0963
+ throughput/total_tokens=267,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1394/500000]
+ train/ActionL1Loss=0.0988
+ throughput/total_tokens=267,648,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1395/500000]
+ train/ActionL1Loss=0.1058
+ throughput/total_tokens=267,840,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1396/500000]
+ train/ActionL1Loss=0.0971
+ throughput/total_tokens=268,032,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1397/500000]
+ train/ActionL1Loss=0.0912
+ throughput/total_tokens=268,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1398/500000]
+ train/ActionL1Loss=0.0818
+ throughput/total_tokens=268,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1399/500000]
+ train/ActionL1Loss=0.1002
+ throughput/total_tokens=268,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1400/500000]
+ optim/total_grad_norm=11.85
+ train/ActionL1Loss=0.0880
+ throughput/total_tokens=268,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1401/500000]
+ train/ActionL1Loss=0.1068
+ throughput/total_tokens=268,992,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1402/500000]
+ train/ActionL1Loss=0.0823
+ throughput/total_tokens=269,184,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1403/500000]
+ train/ActionL1Loss=0.0966
+ throughput/total_tokens=269,376,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1404/500000]
+ train/ActionL1Loss=0.1053
+ throughput/total_tokens=269,568,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1405/500000]
+ train/ActionL1Loss=0.0930
+ throughput/total_tokens=269,760,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1406/500000]
+ train/ActionL1Loss=0.0943
+ throughput/total_tokens=269,952,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1407/500000]
+ train/ActionL1Loss=0.0937
+ throughput/total_tokens=270,144,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1408/500000]
+ train/ActionL1Loss=0.0972
+ throughput/total_tokens=270,336,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1409/500000]
+ train/ActionL1Loss=0.0961
+ throughput/total_tokens=270,528,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1410/500000]
+ train/ActionL1Loss=0.0865
+ throughput/total_tokens=270,720,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=1411/500000]
+ train/ActionL1Loss=0.0959
+ throughput/total_tokens=270,912,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1412/500000]
+ train/ActionL1Loss=0.1029
+ throughput/total_tokens=271,104,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1413/500000]
+ train/ActionL1Loss=0.0946
+ throughput/total_tokens=271,296,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1414/500000]
+ train/ActionL1Loss=0.1016
+ throughput/total_tokens=271,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1415/500000]
+ train/ActionL1Loss=0.0962
+ throughput/total_tokens=271,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1416/500000]
+ train/ActionL1Loss=0.1083
+ throughput/total_tokens=271,872,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1417/500000]
+ train/ActionL1Loss=0.1095
+ throughput/total_tokens=272,064,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1418/500000]
+ train/ActionL1Loss=0.1130
+ throughput/total_tokens=272,256,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1419/500000]
+ train/ActionL1Loss=0.0888
+ throughput/total_tokens=272,448,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1420/500000]
+ optim/total_grad_norm=10.66
+ train/ActionL1Loss=0.0996
+ throughput/total_tokens=272,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1421/500000]
+ train/ActionL1Loss=0.0984
+ throughput/total_tokens=272,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1422/500000]
+ train/ActionL1Loss=0.1099
+ throughput/total_tokens=273,024,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1423/500000]
+ train/ActionL1Loss=0.1078
+ throughput/total_tokens=273,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1424/500000]
+ train/ActionL1Loss=0.0927
+ throughput/total_tokens=273,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1425/500000]
+ train/ActionL1Loss=0.1010
+ throughput/total_tokens=273,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1426/500000]
+ train/ActionL1Loss=0.0973
+ throughput/total_tokens=273,792,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1427/500000]
+ train/ActionL1Loss=0.0897
+ throughput/total_tokens=273,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1428/500000]
+ train/ActionL1Loss=0.1248
+ throughput/total_tokens=274,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1429/500000]
+ train/ActionL1Loss=0.0916
+ throughput/total_tokens=274,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1430/500000]
+ train/ActionL1Loss=0.0986
+ throughput/total_tokens=274,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1431/500000]
+ train/ActionL1Loss=0.1138
+ throughput/total_tokens=274,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1432/500000]
+ train/ActionL1Loss=0.1183
+ throughput/total_tokens=274,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1433/500000]
+ train/ActionL1Loss=0.0928
+ throughput/total_tokens=275,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1434/500000]
+ train/ActionL1Loss=0.0750
+ throughput/total_tokens=275,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1435/500000]
+ train/ActionL1Loss=0.0971
+ throughput/total_tokens=275,520,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1436/500000]
+ train/ActionL1Loss=0.1015
+ throughput/total_tokens=275,712,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1437/500000]
+ train/ActionL1Loss=0.1003
+ throughput/total_tokens=275,904,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1438/500000]
+ train/ActionL1Loss=0.0794
+ throughput/total_tokens=276,096,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1439/500000]
+ train/ActionL1Loss=0.0815
+ throughput/total_tokens=276,288,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1440/500000]
+ optim/total_grad_norm=10.51
+ train/ActionL1Loss=0.1126
+ throughput/total_tokens=276,480,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1441/500000]
+ train/ActionL1Loss=0.1119
+ throughput/total_tokens=276,672,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1442/500000]
+ train/ActionL1Loss=0.0986
+ throughput/total_tokens=276,864,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=1443/500000]
+ train/ActionL1Loss=0.0896
+ throughput/total_tokens=277,056,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1444/500000]
+ train/ActionL1Loss=0.0911
+ throughput/total_tokens=277,248,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1445/500000]
+ train/ActionL1Loss=0.1099
+ throughput/total_tokens=277,440,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1446/500000]
+ train/ActionL1Loss=0.0962
+ throughput/total_tokens=277,632,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1447/500000]
+ train/ActionL1Loss=0.0794
+ throughput/total_tokens=277,824,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1448/500000]
+ train/ActionL1Loss=0.1073
+ throughput/total_tokens=278,016,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1449/500000]
+ train/ActionL1Loss=0.1130
+ throughput/total_tokens=278,208,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1450/500000]
+ train/ActionL1Loss=0.1023
+ throughput/total_tokens=278,400,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1451/500000]
+ train/ActionL1Loss=0.1049
+ throughput/total_tokens=278,592,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1452/500000]
+ train/ActionL1Loss=0.1002
+ throughput/total_tokens=278,784,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1453/500000]
+ train/ActionL1Loss=0.0991
+ throughput/total_tokens=278,976,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1454/500000]
+ train/ActionL1Loss=0.0969
+ throughput/total_tokens=279,168,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1455/500000]
+ train/ActionL1Loss=0.0910
+ throughput/total_tokens=279,360,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1456/500000]
+ train/ActionL1Loss=0.0870
+ throughput/total_tokens=279,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1457/500000]
+ train/ActionL1Loss=0.0836
+ throughput/total_tokens=279,744,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1458/500000]
+ train/ActionL1Loss=0.0949
+ throughput/total_tokens=279,936,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1459/500000]
+ train/ActionL1Loss=0.0989
+ throughput/total_tokens=280,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1460/500000]
+ optim/total_grad_norm=9.090
+ train/ActionL1Loss=0.0958
+ throughput/total_tokens=280,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1461/500000]
+ train/ActionL1Loss=0.0854
+ throughput/total_tokens=280,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1462/500000]
+ train/ActionL1Loss=0.0763
+ throughput/total_tokens=280,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1463/500000]
+ train/ActionL1Loss=0.0726
+ throughput/total_tokens=280,896,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1464/500000]
+ train/ActionL1Loss=0.0991
+ throughput/total_tokens=281,088,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1465/500000]
+ train/ActionL1Loss=0.0727
+ throughput/total_tokens=281,280,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1466/500000]
+ train/ActionL1Loss=0.0705
+ throughput/total_tokens=281,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1467/500000]
+ train/ActionL1Loss=0.0853
+ throughput/total_tokens=281,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1468/500000]
+ train/ActionL1Loss=0.1077
+ throughput/total_tokens=281,856,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1469/500000]
+ train/ActionL1Loss=0.0748
+ throughput/total_tokens=282,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1470/500000]
+ train/ActionL1Loss=0.0891
+ throughput/total_tokens=282,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1471/500000]
+ train/ActionL1Loss=0.0855
+ throughput/total_tokens=282,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1472/500000]
+ train/ActionL1Loss=0.0884
+ throughput/total_tokens=282,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1473/500000]
+ train/ActionL1Loss=0.0933
+ throughput/total_tokens=282,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1474/500000]
+ train/ActionL1Loss=0.0989
+ throughput/total_tokens=283,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1475/500000]
+ train/ActionL1Loss=0.0958
+ throughput/total_tokens=283,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1476/500000]
+ train/ActionL1Loss=0.1192
+ throughput/total_tokens=283,392,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1477/500000]
+ train/ActionL1Loss=0.0939
+ throughput/total_tokens=283,584,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1478/500000]
+ train/ActionL1Loss=0.0964
+ throughput/total_tokens=283,776,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1479/500000]
+ train/ActionL1Loss=0.0831
+ throughput/total_tokens=283,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1480/500000]
+ optim/total_grad_norm=9.954
+ train/ActionL1Loss=0.0933
+ throughput/total_tokens=284,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1481/500000]
+ train/ActionL1Loss=0.0797
+ throughput/total_tokens=284,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1482/500000]
+ train/ActionL1Loss=0.1001
+ throughput/total_tokens=284,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1483/500000]
+ train/ActionL1Loss=0.0790
+ throughput/total_tokens=284,736,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1484/500000]
+ train/ActionL1Loss=0.0872
+ throughput/total_tokens=284,928,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1485/500000]
+ train/ActionL1Loss=0.0891
+ throughput/total_tokens=285,120,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=1486/500000]
+ train/ActionL1Loss=0.0959
+ throughput/total_tokens=285,312,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1487/500000]
+ train/ActionL1Loss=0.1064
+ throughput/total_tokens=285,504,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1488/500000]
+ train/ActionL1Loss=0.0988
+ throughput/total_tokens=285,696,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1489/500000]
+ train/ActionL1Loss=0.0889
+ throughput/total_tokens=285,888,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1490/500000]
+ train/ActionL1Loss=0.0883
+ throughput/total_tokens=286,080,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1491/500000]
+ train/ActionL1Loss=0.1215
+ throughput/total_tokens=286,272,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1492/500000]
+ train/ActionL1Loss=0.1097
+ throughput/total_tokens=286,464,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1493/500000]
+ train/ActionL1Loss=0.1027
+ throughput/total_tokens=286,656,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1494/500000]
+ train/ActionL1Loss=0.0923
+ throughput/total_tokens=286,848,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1495/500000]
+ train/ActionL1Loss=0.1076
+ throughput/total_tokens=287,040,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1496/500000]
+ train/ActionL1Loss=0.0949
+ throughput/total_tokens=287,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1497/500000]
+ train/ActionL1Loss=0.0881
+ throughput/total_tokens=287,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1498/500000]
+ train/ActionL1Loss=0.0900
+ throughput/total_tokens=287,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1499/500000]
+ train/ActionL1Loss=0.0716
+ throughput/total_tokens=287,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1500/500000]
+ optim/total_grad_norm=10.34
+ train/ActionL1Loss=0.0804
+ throughput/total_tokens=288,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+10/03 [01:16:02] INFO | >> Saving config... checkpoint.py:608
+10/03 [01:16:48] INFO | >> Saving model state... checkpoint.py:796
+10/03 [01:17:59] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [01:19:29] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=1501/500000]
+ train/ActionL1Loss=0.1010
+ throughput/total_tokens=288,192,000
+ throughput/device/tokens_per_second=1,219
+ throughput/device/batches_per_second=0.0508
+[step=1502/500000]
+ train/ActionL1Loss=0.0932
+ throughput/total_tokens=288,384,000
+ throughput/device/tokens_per_second=1,195
+ throughput/device/batches_per_second=0.0498
+[step=1503/500000]
+ train/ActionL1Loss=0.1048
+ throughput/total_tokens=288,576,000
+ throughput/device/tokens_per_second=1,192
+ throughput/device/batches_per_second=0.0497
+[step=1504/500000]
+ train/ActionL1Loss=0.1108
+ throughput/total_tokens=288,768,000
+ throughput/device/tokens_per_second=1,192
+ throughput/device/batches_per_second=0.0497
+[step=1505/500000]
+ train/ActionL1Loss=0.1062
+ throughput/total_tokens=288,960,000
+ throughput/device/tokens_per_second=1,191
+ throughput/device/batches_per_second=0.0497
+[step=1506/500000]
+ train/ActionL1Loss=0.0945
+ throughput/total_tokens=289,152,000
+ throughput/device/tokens_per_second=1,191
+ throughput/device/batches_per_second=0.0496
+[step=1507/500000]
+ train/ActionL1Loss=0.0861
+ throughput/total_tokens=289,344,000
+ throughput/device/tokens_per_second=1,190
+ throughput/device/batches_per_second=0.0496
+[step=1508/500000]
+ train/ActionL1Loss=0.0906
+ throughput/total_tokens=289,536,000
+ throughput/device/tokens_per_second=1,190
+ throughput/device/batches_per_second=0.0496
+[step=1509/500000]
+ train/ActionL1Loss=0.1006
+ throughput/total_tokens=289,728,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=1510/500000]
+ train/ActionL1Loss=0.0997
+ throughput/total_tokens=289,920,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=1511/500000]
+ train/ActionL1Loss=0.0851
+ throughput/total_tokens=290,112,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=1512/500000]
+ train/ActionL1Loss=0.0788
+ throughput/total_tokens=290,304,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1513/500000]
+ train/ActionL1Loss=0.0971
+ throughput/total_tokens=290,496,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1514/500000]
+ train/ActionL1Loss=0.0931
+ throughput/total_tokens=290,688,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1515/500000]
+ train/ActionL1Loss=0.0998
+ throughput/total_tokens=290,880,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1516/500000]
+ train/ActionL1Loss=0.0704
+ throughput/total_tokens=291,072,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1517/500000]
+ train/ActionL1Loss=0.0856
+ throughput/total_tokens=291,264,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1518/500000]
+ train/ActionL1Loss=0.0913
+ throughput/total_tokens=291,456,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1519/500000]
+ train/ActionL1Loss=0.0727
+ throughput/total_tokens=291,648,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1520/500000]
+ optim/total_grad_norm=10.28
+ train/ActionL1Loss=0.1119
+ throughput/total_tokens=291,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1521/500000]
+ train/ActionL1Loss=0.0967
+ throughput/total_tokens=292,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1522/500000]
+ train/ActionL1Loss=0.0692
+ throughput/total_tokens=292,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1523/500000]
+ train/ActionL1Loss=0.0806
+ throughput/total_tokens=292,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1524/500000]
+ train/ActionL1Loss=0.0747
+ throughput/total_tokens=292,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1525/500000]
+ train/ActionL1Loss=0.0822
+ throughput/total_tokens=292,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1526/500000]
+ train/ActionL1Loss=0.0908
+ throughput/total_tokens=292,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1527/500000]
+ train/ActionL1Loss=0.0802
+ throughput/total_tokens=293,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1528/500000]
+ train/ActionL1Loss=0.0797
+ throughput/total_tokens=293,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1529/500000]
+ train/ActionL1Loss=0.0835
+ throughput/total_tokens=293,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1530/500000]
+ train/ActionL1Loss=0.0647
+ throughput/total_tokens=293,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1531/500000]
+ train/ActionL1Loss=0.0819
+ throughput/total_tokens=293,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1532/500000]
+ train/ActionL1Loss=0.0839
+ throughput/total_tokens=294,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1533/500000]
+ train/ActionL1Loss=0.0791
+ throughput/total_tokens=294,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1534/500000]
+ train/ActionL1Loss=0.0789
+ throughput/total_tokens=294,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1535/500000]
+ train/ActionL1Loss=0.0729
+ throughput/total_tokens=294,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1536/500000]
+ train/ActionL1Loss=0.0925
+ throughput/total_tokens=294,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1537/500000]
+ train/ActionL1Loss=0.0733
+ throughput/total_tokens=295,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1538/500000]
+ train/ActionL1Loss=0.0671
+ throughput/total_tokens=295,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1539/500000]
+ train/ActionL1Loss=0.0863
+ throughput/total_tokens=295,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1540/500000]
+ optim/total_grad_norm=10.06
+ train/ActionL1Loss=0.0744
+ throughput/total_tokens=295,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1541/500000]
+ train/ActionL1Loss=0.0713
+ throughput/total_tokens=295,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1542/500000]
+ train/ActionL1Loss=0.1020
+ throughput/total_tokens=296,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1543/500000]
+ train/ActionL1Loss=0.0881
+ throughput/total_tokens=296,256,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1544/500000]
+ train/ActionL1Loss=0.0898
+ throughput/total_tokens=296,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1545/500000]
+ train/ActionL1Loss=0.0725
+ throughput/total_tokens=296,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1546/500000]
+ train/ActionL1Loss=0.1027
+ throughput/total_tokens=296,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1547/500000]
+ train/ActionL1Loss=0.0985
+ throughput/total_tokens=297,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1548/500000]
+ train/ActionL1Loss=0.1036
+ throughput/total_tokens=297,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1549/500000]
+ train/ActionL1Loss=0.0872
+ throughput/total_tokens=297,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1550/500000]
+ train/ActionL1Loss=0.0968
+ throughput/total_tokens=297,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1551/500000]
+ train/ActionL1Loss=0.0976
+ throughput/total_tokens=297,792,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1552/500000]
+ train/ActionL1Loss=0.1206
+ throughput/total_tokens=297,984,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1553/500000]
+ train/ActionL1Loss=0.1040
+ throughput/total_tokens=298,176,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1554/500000]
+ train/ActionL1Loss=0.1125
+ throughput/total_tokens=298,368,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1555/500000]
+ train/ActionL1Loss=0.1089
+ throughput/total_tokens=298,560,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1556/500000]
+ train/ActionL1Loss=0.0941
+ throughput/total_tokens=298,752,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1557/500000]
+ train/ActionL1Loss=0.0974
+ throughput/total_tokens=298,944,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1558/500000]
+ train/ActionL1Loss=0.1025
+ throughput/total_tokens=299,136,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1559/500000]
+ train/ActionL1Loss=0.0828
+ throughput/total_tokens=299,328,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1560/500000]
+ optim/total_grad_norm=8.787
+ train/ActionL1Loss=0.0759
+ throughput/total_tokens=299,520,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1561/500000]
+ train/ActionL1Loss=0.0942
+ throughput/total_tokens=299,712,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1562/500000]
+ train/ActionL1Loss=0.0736
+ throughput/total_tokens=299,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1563/500000]
+ train/ActionL1Loss=0.0743
+ throughput/total_tokens=300,096,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1564/500000]
+ train/ActionL1Loss=0.1048
+ throughput/total_tokens=300,288,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1565/500000]
+ train/ActionL1Loss=0.0864
+ throughput/total_tokens=300,480,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1566/500000]
+ train/ActionL1Loss=0.0772
+ throughput/total_tokens=300,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1567/500000]
+ train/ActionL1Loss=0.1026
+ throughput/total_tokens=300,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1568/500000]
+ train/ActionL1Loss=0.0956
+ throughput/total_tokens=301,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1569/500000]
+ train/ActionL1Loss=0.0997
+ throughput/total_tokens=301,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1570/500000]
+ train/ActionL1Loss=0.0773
+ throughput/total_tokens=301,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1571/500000]
+ train/ActionL1Loss=0.0930
+ throughput/total_tokens=301,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1572/500000]
+ train/ActionL1Loss=0.0786
+ throughput/total_tokens=301,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1573/500000]
+ train/ActionL1Loss=0.0958
+ throughput/total_tokens=302,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1574/500000]
+ train/ActionL1Loss=0.1490
+ throughput/total_tokens=302,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1575/500000]
+ train/ActionL1Loss=0.0887
+ throughput/total_tokens=302,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1576/500000]
+ train/ActionL1Loss=0.0930
+ throughput/total_tokens=302,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1577/500000]
+ train/ActionL1Loss=0.1654
+ throughput/total_tokens=302,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1578/500000]
+ train/ActionL1Loss=0.1053
+ throughput/total_tokens=302,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1579/500000]
+ train/ActionL1Loss=0.1550
+ throughput/total_tokens=303,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1580/500000]
+ optim/total_grad_norm=9.484
+ train/ActionL1Loss=0.0990
+ throughput/total_tokens=303,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1581/500000]
+ train/ActionL1Loss=0.0769
+ throughput/total_tokens=303,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1582/500000]
+ train/ActionL1Loss=0.0833
+ throughput/total_tokens=303,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1583/500000]
+ train/ActionL1Loss=0.0916
+ throughput/total_tokens=303,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1584/500000]
+ train/ActionL1Loss=0.0913
+ throughput/total_tokens=304,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1585/500000]
+ train/ActionL1Loss=0.0813
+ throughput/total_tokens=304,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1586/500000]
+ train/ActionL1Loss=0.0950
+ throughput/total_tokens=304,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1587/500000]
+ train/ActionL1Loss=0.0748
+ throughput/total_tokens=304,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1588/500000]
+ train/ActionL1Loss=0.0808
+ throughput/total_tokens=304,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1589/500000]
+ train/ActionL1Loss=0.0865
+ throughput/total_tokens=305,088,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1590/500000]
+ train/ActionL1Loss=0.0978
+ throughput/total_tokens=305,280,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1591/500000]
+ train/ActionL1Loss=0.0774
+ throughput/total_tokens=305,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1592/500000]
+ train/ActionL1Loss=0.0919
+ throughput/total_tokens=305,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1593/500000]
+ train/ActionL1Loss=0.0906
+ throughput/total_tokens=305,856,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1594/500000]
+ train/ActionL1Loss=0.0940
+ throughput/total_tokens=306,048,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1595/500000]
+ train/ActionL1Loss=0.0847
+ throughput/total_tokens=306,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1596/500000]
+ train/ActionL1Loss=0.0794
+ throughput/total_tokens=306,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1597/500000]
+ train/ActionL1Loss=0.0771
+ throughput/total_tokens=306,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1598/500000]
+ train/ActionL1Loss=0.0985
+ throughput/total_tokens=306,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1599/500000]
+ train/ActionL1Loss=0.0861
+ throughput/total_tokens=307,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1600/500000]
+ optim/total_grad_norm=9.144
+ train/ActionL1Loss=0.0968
+ throughput/total_tokens=307,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1601/500000]
+ train/ActionL1Loss=0.0862
+ throughput/total_tokens=307,392,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1602/500000]
+ train/ActionL1Loss=0.0917
+ throughput/total_tokens=307,584,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1603/500000]
+ train/ActionL1Loss=0.1116
+ throughput/total_tokens=307,776,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1604/500000]
+ train/ActionL1Loss=0.0936
+ throughput/total_tokens=307,968,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1605/500000]
+ train/ActionL1Loss=0.1015
+ throughput/total_tokens=308,160,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1606/500000]
+ train/ActionL1Loss=0.1015
+ throughput/total_tokens=308,352,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1607/500000]
+ train/ActionL1Loss=0.0913
+ throughput/total_tokens=308,544,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1608/500000]
+ train/ActionL1Loss=0.0977
+ throughput/total_tokens=308,736,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1609/500000]
+ train/ActionL1Loss=0.0802
+ throughput/total_tokens=308,928,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1610/500000]
+ train/ActionL1Loss=0.0849
+ throughput/total_tokens=309,120,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=1611/500000]
+ train/ActionL1Loss=0.0825
+ throughput/total_tokens=309,312,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1612/500000]
+ train/ActionL1Loss=0.1081
+ throughput/total_tokens=309,504,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1613/500000]
+ train/ActionL1Loss=0.0881
+ throughput/total_tokens=309,696,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1614/500000]
+ train/ActionL1Loss=0.0697
+ throughput/total_tokens=309,888,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1615/500000]
+ train/ActionL1Loss=0.0832
+ throughput/total_tokens=310,080,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1616/500000]
+ train/ActionL1Loss=0.0842
+ throughput/total_tokens=310,272,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1617/500000]
+ train/ActionL1Loss=0.0793
+ throughput/total_tokens=310,464,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1618/500000]
+ train/ActionL1Loss=0.0797
+ throughput/total_tokens=310,656,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1619/500000]
+ train/ActionL1Loss=0.0980
+ throughput/total_tokens=310,848,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1620/500000]
+ optim/total_grad_norm=9.280
+ train/ActionL1Loss=0.1078
+ throughput/total_tokens=311,040,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1621/500000]
+ train/ActionL1Loss=0.0851
+ throughput/total_tokens=311,232,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1622/500000]
+ train/ActionL1Loss=0.0817
+ throughput/total_tokens=311,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1623/500000]
+ train/ActionL1Loss=0.0790
+ throughput/total_tokens=311,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1624/500000]
+ train/ActionL1Loss=0.0791
+ throughput/total_tokens=311,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1625/500000]
+ train/ActionL1Loss=0.0799
+ throughput/total_tokens=312,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1626/500000]
+ train/ActionL1Loss=0.0738
+ throughput/total_tokens=312,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1627/500000]
+ train/ActionL1Loss=0.0798
+ throughput/total_tokens=312,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1628/500000]
+ train/ActionL1Loss=0.0975
+ throughput/total_tokens=312,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1629/500000]
+ train/ActionL1Loss=0.0807
+ throughput/total_tokens=312,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1630/500000]
+ train/ActionL1Loss=0.0915
+ throughput/total_tokens=312,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1631/500000]
+ train/ActionL1Loss=0.0882
+ throughput/total_tokens=313,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1632/500000]
+ train/ActionL1Loss=0.0938
+ throughput/total_tokens=313,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1633/500000]
+ train/ActionL1Loss=0.0906
+ throughput/total_tokens=313,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1634/500000]
+ train/ActionL1Loss=0.0882
+ throughput/total_tokens=313,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1635/500000]
+ train/ActionL1Loss=0.0959
+ throughput/total_tokens=313,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1636/500000]
+ train/ActionL1Loss=0.1119
+ throughput/total_tokens=314,112,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1637/500000]
+ train/ActionL1Loss=0.0959
+ throughput/total_tokens=314,304,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1638/500000]
+ train/ActionL1Loss=0.0852
+ throughput/total_tokens=314,496,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1639/500000]
+ train/ActionL1Loss=0.0944
+ throughput/total_tokens=314,688,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1640/500000]
+ optim/total_grad_norm=11.48
+ train/ActionL1Loss=0.0756
+ throughput/total_tokens=314,880,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1641/500000]
+ train/ActionL1Loss=0.0894
+ throughput/total_tokens=315,072,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1642/500000]
+ train/ActionL1Loss=0.0730
+ throughput/total_tokens=315,264,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1643/500000]
+ train/ActionL1Loss=0.0739
+ throughput/total_tokens=315,456,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1644/500000]
+ train/ActionL1Loss=0.0664
+ throughput/total_tokens=315,648,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1645/500000]
+ train/ActionL1Loss=0.0729
+ throughput/total_tokens=315,840,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1646/500000]
+ train/ActionL1Loss=0.1167
+ throughput/total_tokens=316,032,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1647/500000]
+ train/ActionL1Loss=0.0710
+ throughput/total_tokens=316,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1648/500000]
+ train/ActionL1Loss=0.0769
+ throughput/total_tokens=316,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1649/500000]
+ train/ActionL1Loss=0.0746
+ throughput/total_tokens=316,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1650/500000]
+ train/ActionL1Loss=0.0861
+ throughput/total_tokens=316,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1651/500000]
+ train/ActionL1Loss=0.0842
+ throughput/total_tokens=316,992,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1652/500000]
+ train/ActionL1Loss=0.0881
+ throughput/total_tokens=317,184,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1653/500000]
+ train/ActionL1Loss=0.0785
+ throughput/total_tokens=317,376,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1654/500000]
+ train/ActionL1Loss=0.0846
+ throughput/total_tokens=317,568,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=1655/500000]
+ train/ActionL1Loss=0.0976
+ throughput/total_tokens=317,760,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1656/500000]
+ train/ActionL1Loss=0.0851
+ throughput/total_tokens=317,952,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1657/500000]
+ train/ActionL1Loss=0.0752
+ throughput/total_tokens=318,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1658/500000]
+ train/ActionL1Loss=0.0815
+ throughput/total_tokens=318,336,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1659/500000]
+ train/ActionL1Loss=0.0740
+ throughput/total_tokens=318,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1660/500000]
+ optim/total_grad_norm=9.659
+ train/ActionL1Loss=0.0922
+ throughput/total_tokens=318,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=1661/500000]
+ train/ActionL1Loss=0.0965
+ throughput/total_tokens=318,912,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1662/500000]
+ train/ActionL1Loss=0.0758
+ throughput/total_tokens=319,104,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1663/500000]
+ train/ActionL1Loss=0.0913
+ throughput/total_tokens=319,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1664/500000]
+ train/ActionL1Loss=0.0871
+ throughput/total_tokens=319,488,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1665/500000]
+ train/ActionL1Loss=0.0778
+ throughput/total_tokens=319,680,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1666/500000]
+ train/ActionL1Loss=0.0803
+ throughput/total_tokens=319,872,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1667/500000]
+ train/ActionL1Loss=0.0806
+ throughput/total_tokens=320,064,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1668/500000]
+ train/ActionL1Loss=0.0783
+ throughput/total_tokens=320,256,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1669/500000]
+ train/ActionL1Loss=0.0911
+ throughput/total_tokens=320,448,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1670/500000]
+ train/ActionL1Loss=0.0843
+ throughput/total_tokens=320,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1671/500000]
+ train/ActionL1Loss=0.0753
+ throughput/total_tokens=320,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1672/500000]
+ train/ActionL1Loss=0.0653
+ throughput/total_tokens=321,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1673/500000]
+ train/ActionL1Loss=0.0975
+ throughput/total_tokens=321,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1674/500000]
+ train/ActionL1Loss=0.0976
+ throughput/total_tokens=321,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1675/500000]
+ train/ActionL1Loss=0.0772
+ throughput/total_tokens=321,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1676/500000]
+ train/ActionL1Loss=0.0799
+ throughput/total_tokens=321,792,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1677/500000]
+ train/ActionL1Loss=0.0768
+ throughput/total_tokens=321,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1678/500000]
+ train/ActionL1Loss=0.0666
+ throughput/total_tokens=322,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1679/500000]
+ train/ActionL1Loss=0.0902
+ throughput/total_tokens=322,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1680/500000]
+ optim/total_grad_norm=7.778
+ train/ActionL1Loss=0.0831
+ throughput/total_tokens=322,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1681/500000]
+ train/ActionL1Loss=0.0730
+ throughput/total_tokens=322,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1682/500000]
+ train/ActionL1Loss=0.0793
+ throughput/total_tokens=322,944,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1683/500000]
+ train/ActionL1Loss=0.0871
+ throughput/total_tokens=323,136,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1684/500000]
+ train/ActionL1Loss=0.0762
+ throughput/total_tokens=323,328,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1685/500000]
+ train/ActionL1Loss=0.0887
+ throughput/total_tokens=323,520,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1686/500000]
+ train/ActionL1Loss=0.0774
+ throughput/total_tokens=323,712,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1687/500000]
+ train/ActionL1Loss=0.0856
+ throughput/total_tokens=323,904,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1688/500000]
+ train/ActionL1Loss=0.0768
+ throughput/total_tokens=324,096,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1689/500000]
+ train/ActionL1Loss=0.0875
+ throughput/total_tokens=324,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1690/500000]
+ train/ActionL1Loss=0.0790
+ throughput/total_tokens=324,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1691/500000]
+ train/ActionL1Loss=0.0911
+ throughput/total_tokens=324,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1692/500000]
+ train/ActionL1Loss=0.1109
+ throughput/total_tokens=324,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1693/500000]
+ train/ActionL1Loss=0.1026
+ throughput/total_tokens=325,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1694/500000]
+ train/ActionL1Loss=0.0933
+ throughput/total_tokens=325,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1695/500000]
+ train/ActionL1Loss=0.1008
+ throughput/total_tokens=325,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1696/500000]
+ train/ActionL1Loss=0.0944
+ throughput/total_tokens=325,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1697/500000]
+ train/ActionL1Loss=0.0865
+ throughput/total_tokens=325,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1698/500000]
+ train/ActionL1Loss=0.0856
+ throughput/total_tokens=326,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1699/500000]
+ train/ActionL1Loss=0.0664
+ throughput/total_tokens=326,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1700/500000]
+ optim/total_grad_norm=9.073
+ train/ActionL1Loss=0.0943
+ throughput/total_tokens=326,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1701/500000]
+ train/ActionL1Loss=0.0861
+ throughput/total_tokens=326,592,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1702/500000]
+ train/ActionL1Loss=0.1083
+ throughput/total_tokens=326,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1703/500000]
+ train/ActionL1Loss=0.0854
+ throughput/total_tokens=326,976,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1704/500000]
+ train/ActionL1Loss=0.0784
+ throughput/total_tokens=327,168,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1705/500000]
+ train/ActionL1Loss=0.0928
+ throughput/total_tokens=327,360,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1706/500000]
+ train/ActionL1Loss=0.0881
+ throughput/total_tokens=327,552,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1707/500000]
+ train/ActionL1Loss=0.0860
+ throughput/total_tokens=327,744,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1708/500000]
+ train/ActionL1Loss=0.0827
+ throughput/total_tokens=327,936,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1709/500000]
+ train/ActionL1Loss=0.0929
+ throughput/total_tokens=328,128,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1710/500000]
+ train/ActionL1Loss=0.0921
+ throughput/total_tokens=328,320,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=1711/500000]
+ train/ActionL1Loss=0.0773
+ throughput/total_tokens=328,512,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1712/500000]
+ train/ActionL1Loss=0.0895
+ throughput/total_tokens=328,704,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1713/500000]
+ train/ActionL1Loss=0.0819
+ throughput/total_tokens=328,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1714/500000]
+ train/ActionL1Loss=0.0714
+ throughput/total_tokens=329,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1715/500000]
+ train/ActionL1Loss=0.0745
+ throughput/total_tokens=329,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1716/500000]
+ train/ActionL1Loss=0.0776
+ throughput/total_tokens=329,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1717/500000]
+ train/ActionL1Loss=0.0752
+ throughput/total_tokens=329,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1718/500000]
+ train/ActionL1Loss=0.0686
+ throughput/total_tokens=329,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1719/500000]
+ train/ActionL1Loss=0.0773
+ throughput/total_tokens=330,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1720/500000]
+ optim/total_grad_norm=7.937
+ train/ActionL1Loss=0.0826
+ throughput/total_tokens=330,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1721/500000]
+ train/ActionL1Loss=0.0722
+ throughput/total_tokens=330,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1722/500000]
+ train/ActionL1Loss=0.0932
+ throughput/total_tokens=330,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1723/500000]
+ train/ActionL1Loss=0.0898
+ throughput/total_tokens=330,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1724/500000]
+ train/ActionL1Loss=0.0801
+ throughput/total_tokens=331,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1725/500000]
+ train/ActionL1Loss=0.0657
+ throughput/total_tokens=331,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1726/500000]
+ train/ActionL1Loss=0.0736
+ throughput/total_tokens=331,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1727/500000]
+ train/ActionL1Loss=0.0867
+ throughput/total_tokens=331,584,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1728/500000]
+ train/ActionL1Loss=0.1381
+ throughput/total_tokens=331,776,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1729/500000]
+ train/ActionL1Loss=0.0684
+ throughput/total_tokens=331,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1730/500000]
+ train/ActionL1Loss=0.0851
+ throughput/total_tokens=332,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1731/500000]
+ train/ActionL1Loss=0.0822
+ throughput/total_tokens=332,352,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1732/500000]
+ train/ActionL1Loss=0.0809
+ throughput/total_tokens=332,544,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1733/500000]
+ train/ActionL1Loss=0.0817
+ throughput/total_tokens=332,736,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1734/500000]
+ train/ActionL1Loss=0.0882
+ throughput/total_tokens=332,928,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1735/500000]
+ train/ActionL1Loss=0.0956
+ throughput/total_tokens=333,120,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1736/500000]
+ train/ActionL1Loss=0.0800
+ throughput/total_tokens=333,312,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1737/500000]
+ train/ActionL1Loss=0.0904
+ throughput/total_tokens=333,504,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1738/500000]
+ train/ActionL1Loss=0.0808
+ throughput/total_tokens=333,696,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1739/500000]
+ train/ActionL1Loss=0.0804
+ throughput/total_tokens=333,888,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1740/500000]
+ optim/total_grad_norm=8.932
+ train/ActionL1Loss=0.0966
+ throughput/total_tokens=334,080,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1741/500000]
+ train/ActionL1Loss=0.0645
+ throughput/total_tokens=334,272,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1742/500000]
+ train/ActionL1Loss=0.0789
+ throughput/total_tokens=334,464,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1743/500000]
+ train/ActionL1Loss=0.0853
+ throughput/total_tokens=334,656,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1744/500000]
+ train/ActionL1Loss=0.0783
+ throughput/total_tokens=334,848,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1745/500000]
+ train/ActionL1Loss=0.0748
+ throughput/total_tokens=335,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1746/500000]
+ train/ActionL1Loss=0.0772
+ throughput/total_tokens=335,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1747/500000]
+ train/ActionL1Loss=0.0796
+ throughput/total_tokens=335,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1748/500000]
+ train/ActionL1Loss=0.0713
+ throughput/total_tokens=335,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1749/500000]
+ train/ActionL1Loss=0.0802
+ throughput/total_tokens=335,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1750/500000]
+ train/ActionL1Loss=0.0782
+ throughput/total_tokens=336,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1751/500000]
+ train/ActionL1Loss=0.0811
+ throughput/total_tokens=336,192,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1752/500000]
+ train/ActionL1Loss=0.0890
+ throughput/total_tokens=336,384,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1753/500000]
+ train/ActionL1Loss=0.0843
+ throughput/total_tokens=336,576,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1754/500000]
+ train/ActionL1Loss=0.0697
+ throughput/total_tokens=336,768,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1755/500000]
+ train/ActionL1Loss=0.0862
+ throughput/total_tokens=336,960,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1756/500000]
+ train/ActionL1Loss=0.0800
+ throughput/total_tokens=337,152,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1757/500000]
+ train/ActionL1Loss=0.0735
+ throughput/total_tokens=337,344,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1758/500000]
+ train/ActionL1Loss=0.0867
+ throughput/total_tokens=337,536,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1759/500000]
+ train/ActionL1Loss=0.0760
+ throughput/total_tokens=337,728,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1760/500000]
+ optim/total_grad_norm=9.075
+ train/ActionL1Loss=0.0746
+ throughput/total_tokens=337,920,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=1761/500000]
+ train/ActionL1Loss=0.0765
+ throughput/total_tokens=338,112,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1762/500000]
+ train/ActionL1Loss=0.0940
+ throughput/total_tokens=338,304,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1763/500000]
+ train/ActionL1Loss=0.0823
+ throughput/total_tokens=338,496,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1764/500000]
+ train/ActionL1Loss=0.1104
+ throughput/total_tokens=338,688,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1765/500000]
+ train/ActionL1Loss=0.1098
+ throughput/total_tokens=338,880,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1766/500000]
+ train/ActionL1Loss=0.0902
+ throughput/total_tokens=339,072,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1767/500000]
+ train/ActionL1Loss=0.0850
+ throughput/total_tokens=339,264,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1768/500000]
+ train/ActionL1Loss=0.0999
+ throughput/total_tokens=339,456,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1769/500000]
+ train/ActionL1Loss=0.0918
+ throughput/total_tokens=339,648,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1770/500000]
+ train/ActionL1Loss=0.0822
+ throughput/total_tokens=339,840,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1771/500000]
+ train/ActionL1Loss=0.0765
+ throughput/total_tokens=340,032,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1772/500000]
+ train/ActionL1Loss=0.0856
+ throughput/total_tokens=340,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1773/500000]
+ train/ActionL1Loss=0.0802
+ throughput/total_tokens=340,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1774/500000]
+ train/ActionL1Loss=0.0856
+ throughput/total_tokens=340,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1775/500000]
+ train/ActionL1Loss=0.0897
+ throughput/total_tokens=340,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1776/500000]
+ train/ActionL1Loss=0.0871
+ throughput/total_tokens=340,992,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1777/500000]
+ train/ActionL1Loss=0.0816
+ throughput/total_tokens=341,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1778/500000]
+ train/ActionL1Loss=0.0791
+ throughput/total_tokens=341,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1779/500000]
+ train/ActionL1Loss=0.0815
+ throughput/total_tokens=341,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1780/500000]
+ optim/total_grad_norm=10.09
+ train/ActionL1Loss=0.1003
+ throughput/total_tokens=341,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1781/500000]
+ train/ActionL1Loss=0.0946
+ throughput/total_tokens=341,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1782/500000]
+ train/ActionL1Loss=0.1075
+ throughput/total_tokens=342,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1783/500000]
+ train/ActionL1Loss=0.1010
+ throughput/total_tokens=342,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1784/500000]
+ train/ActionL1Loss=0.0896
+ throughput/total_tokens=342,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1785/500000]
+ train/ActionL1Loss=0.0907
+ throughput/total_tokens=342,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1786/500000]
+ train/ActionL1Loss=0.0850
+ throughput/total_tokens=342,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1787/500000]
+ train/ActionL1Loss=0.0894
+ throughput/total_tokens=343,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1788/500000]
+ train/ActionL1Loss=0.0785
+ throughput/total_tokens=343,296,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1789/500000]
+ train/ActionL1Loss=0.0981
+ throughput/total_tokens=343,488,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1790/500000]
+ train/ActionL1Loss=0.0957
+ throughput/total_tokens=343,680,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1791/500000]
+ train/ActionL1Loss=0.0851
+ throughput/total_tokens=343,872,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1792/500000]
+ train/ActionL1Loss=0.0961
+ throughput/total_tokens=344,064,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1793/500000]
+ train/ActionL1Loss=0.0822
+ throughput/total_tokens=344,256,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1794/500000]
+ train/ActionL1Loss=0.1018
+ throughput/total_tokens=344,448,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1795/500000]
+ train/ActionL1Loss=0.0967
+ throughput/total_tokens=344,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1796/500000]
+ train/ActionL1Loss=0.0821
+ throughput/total_tokens=344,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1797/500000]
+ train/ActionL1Loss=0.1002
+ throughput/total_tokens=345,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1798/500000]
+ train/ActionL1Loss=0.0807
+ throughput/total_tokens=345,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1799/500000]
+ train/ActionL1Loss=0.0780
+ throughput/total_tokens=345,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1800/500000]
+ optim/total_grad_norm=9.562
+ train/ActionL1Loss=0.0827
+ throughput/total_tokens=345,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1801/500000]
+ train/ActionL1Loss=0.0832
+ throughput/total_tokens=345,792,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1802/500000]
+ train/ActionL1Loss=0.0806
+ throughput/total_tokens=345,984,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1803/500000]
+ train/ActionL1Loss=0.0868
+ throughput/total_tokens=346,176,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1804/500000]
+ train/ActionL1Loss=0.0707
+ throughput/total_tokens=346,368,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1805/500000]
+ train/ActionL1Loss=0.0697
+ throughput/total_tokens=346,560,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1806/500000]
+ train/ActionL1Loss=0.0677
+ throughput/total_tokens=346,752,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1807/500000]
+ train/ActionL1Loss=0.0725
+ throughput/total_tokens=346,944,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1808/500000]
+ train/ActionL1Loss=0.0687
+ throughput/total_tokens=347,136,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1809/500000]
+ train/ActionL1Loss=0.0725
+ throughput/total_tokens=347,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1810/500000]
+ train/ActionL1Loss=0.0803
+ throughput/total_tokens=347,520,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=1811/500000]
+ train/ActionL1Loss=0.0673
+ throughput/total_tokens=347,712,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1812/500000]
+ train/ActionL1Loss=0.0675
+ throughput/total_tokens=347,904,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1813/500000]
+ train/ActionL1Loss=0.0752
+ throughput/total_tokens=348,096,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1814/500000]
+ train/ActionL1Loss=0.0858
+ throughput/total_tokens=348,288,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1815/500000]
+ train/ActionL1Loss=0.0998
+ throughput/total_tokens=348,480,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1816/500000]
+ train/ActionL1Loss=0.0700
+ throughput/total_tokens=348,672,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1817/500000]
+ train/ActionL1Loss=0.0984
+ throughput/total_tokens=348,864,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1818/500000]
+ train/ActionL1Loss=0.0761
+ throughput/total_tokens=349,056,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1819/500000]
+ train/ActionL1Loss=0.0785
+ throughput/total_tokens=349,248,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1820/500000]
+ optim/total_grad_norm=10.17
+ train/ActionL1Loss=0.0987
+ throughput/total_tokens=349,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1821/500000]
+ train/ActionL1Loss=0.0904
+ throughput/total_tokens=349,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1822/500000]
+ train/ActionL1Loss=0.0855
+ throughput/total_tokens=349,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1823/500000]
+ train/ActionL1Loss=0.0845
+ throughput/total_tokens=350,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1824/500000]
+ train/ActionL1Loss=0.0716
+ throughput/total_tokens=350,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1825/500000]
+ train/ActionL1Loss=0.0972
+ throughput/total_tokens=350,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1826/500000]
+ train/ActionL1Loss=0.0814
+ throughput/total_tokens=350,592,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1827/500000]
+ train/ActionL1Loss=0.1149
+ throughput/total_tokens=350,784,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1828/500000]
+ train/ActionL1Loss=0.0788
+ throughput/total_tokens=350,976,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1829/500000]
+ train/ActionL1Loss=0.0996
+ throughput/total_tokens=351,168,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1830/500000]
+ train/ActionL1Loss=0.0761
+ throughput/total_tokens=351,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1831/500000]
+ train/ActionL1Loss=0.0854
+ throughput/total_tokens=351,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1832/500000]
+ train/ActionL1Loss=0.0992
+ throughput/total_tokens=351,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1833/500000]
+ train/ActionL1Loss=0.0980
+ throughput/total_tokens=351,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1834/500000]
+ train/ActionL1Loss=0.0944
+ throughput/total_tokens=352,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1835/500000]
+ train/ActionL1Loss=0.0936
+ throughput/total_tokens=352,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1836/500000]
+ train/ActionL1Loss=0.1136
+ throughput/total_tokens=352,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1837/500000]
+ train/ActionL1Loss=0.1186
+ throughput/total_tokens=352,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1838/500000]
+ train/ActionL1Loss=0.1080
+ throughput/total_tokens=352,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1839/500000]
+ train/ActionL1Loss=0.1127
+ throughput/total_tokens=353,088,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1840/500000]
+ optim/total_grad_norm=9.572
+ train/ActionL1Loss=0.1264
+ throughput/total_tokens=353,280,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1841/500000]
+ train/ActionL1Loss=0.1167
+ throughput/total_tokens=353,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1842/500000]
+ train/ActionL1Loss=0.1060
+ throughput/total_tokens=353,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1843/500000]
+ train/ActionL1Loss=0.0902
+ throughput/total_tokens=353,856,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1844/500000]
+ train/ActionL1Loss=0.1038
+ throughput/total_tokens=354,048,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1845/500000]
+ train/ActionL1Loss=0.0927
+ throughput/total_tokens=354,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1846/500000]
+ train/ActionL1Loss=0.1316
+ throughput/total_tokens=354,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1847/500000]
+ train/ActionL1Loss=0.0933
+ throughput/total_tokens=354,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1848/500000]
+ train/ActionL1Loss=0.0973
+ throughput/total_tokens=354,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1849/500000]
+ train/ActionL1Loss=0.0942
+ throughput/total_tokens=355,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1850/500000]
+ train/ActionL1Loss=0.0861
+ throughput/total_tokens=355,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1851/500000]
+ train/ActionL1Loss=0.0933
+ throughput/total_tokens=355,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1852/500000]
+ train/ActionL1Loss=0.1059
+ throughput/total_tokens=355,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1853/500000]
+ train/ActionL1Loss=0.0900
+ throughput/total_tokens=355,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1854/500000]
+ train/ActionL1Loss=0.0884
+ throughput/total_tokens=355,968,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1855/500000]
+ train/ActionL1Loss=0.0748
+ throughput/total_tokens=356,160,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1856/500000]
+ train/ActionL1Loss=0.0858
+ throughput/total_tokens=356,352,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1857/500000]
+ train/ActionL1Loss=0.0898
+ throughput/total_tokens=356,544,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1858/500000]
+ train/ActionL1Loss=0.0958
+ throughput/total_tokens=356,736,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1859/500000]
+ train/ActionL1Loss=0.0910
+ throughput/total_tokens=356,928,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1860/500000]
+ optim/total_grad_norm=8.805
+ train/ActionL1Loss=0.0930
+ throughput/total_tokens=357,120,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1861/500000]
+ train/ActionL1Loss=0.0814
+ throughput/total_tokens=357,312,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1862/500000]
+ train/ActionL1Loss=0.0852
+ throughput/total_tokens=357,504,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1863/500000]
+ train/ActionL1Loss=0.0812
+ throughput/total_tokens=357,696,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1864/500000]
+ train/ActionL1Loss=0.0893
+ throughput/total_tokens=357,888,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1865/500000]
+ train/ActionL1Loss=0.0995
+ throughput/total_tokens=358,080,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1866/500000]
+ train/ActionL1Loss=0.1028
+ throughput/total_tokens=358,272,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1867/500000]
+ train/ActionL1Loss=0.0825
+ throughput/total_tokens=358,464,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1868/500000]
+ train/ActionL1Loss=0.0698
+ throughput/total_tokens=358,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1869/500000]
+ train/ActionL1Loss=0.0996
+ throughput/total_tokens=358,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1870/500000]
+ train/ActionL1Loss=0.0810
+ throughput/total_tokens=359,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1871/500000]
+ train/ActionL1Loss=0.0766
+ throughput/total_tokens=359,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1872/500000]
+ train/ActionL1Loss=0.0844
+ throughput/total_tokens=359,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1873/500000]
+ train/ActionL1Loss=0.0767
+ throughput/total_tokens=359,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1874/500000]
+ train/ActionL1Loss=0.0823
+ throughput/total_tokens=359,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1875/500000]
+ train/ActionL1Loss=0.0768
+ throughput/total_tokens=360,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1876/500000]
+ train/ActionL1Loss=0.1004
+ throughput/total_tokens=360,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1877/500000]
+ train/ActionL1Loss=0.0683
+ throughput/total_tokens=360,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1878/500000]
+ train/ActionL1Loss=0.0795
+ throughput/total_tokens=360,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1879/500000]
+ train/ActionL1Loss=0.0802
+ throughput/total_tokens=360,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1880/500000]
+ optim/total_grad_norm=8.366
+ train/ActionL1Loss=0.0856
+ throughput/total_tokens=360,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1881/500000]
+ train/ActionL1Loss=0.0792
+ throughput/total_tokens=361,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1882/500000]
+ train/ActionL1Loss=0.0683
+ throughput/total_tokens=361,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1883/500000]
+ train/ActionL1Loss=0.0749
+ throughput/total_tokens=361,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1884/500000]
+ train/ActionL1Loss=0.0812
+ throughput/total_tokens=361,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1885/500000]
+ train/ActionL1Loss=0.0823
+ throughput/total_tokens=361,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1886/500000]
+ train/ActionL1Loss=0.0842
+ throughput/total_tokens=362,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1887/500000]
+ train/ActionL1Loss=0.0830
+ throughput/total_tokens=362,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1888/500000]
+ train/ActionL1Loss=0.0833
+ throughput/total_tokens=362,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1889/500000]
+ train/ActionL1Loss=0.0744
+ throughput/total_tokens=362,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1890/500000]
+ train/ActionL1Loss=0.0666
+ throughput/total_tokens=362,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1891/500000]
+ train/ActionL1Loss=0.0875
+ throughput/total_tokens=363,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1892/500000]
+ train/ActionL1Loss=0.0739
+ throughput/total_tokens=363,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1893/500000]
+ train/ActionL1Loss=0.0641
+ throughput/total_tokens=363,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1894/500000]
+ train/ActionL1Loss=0.0712
+ throughput/total_tokens=363,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1895/500000]
+ train/ActionL1Loss=0.0684
+ throughput/total_tokens=363,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1896/500000]
+ train/ActionL1Loss=0.0757
+ throughput/total_tokens=364,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1897/500000]
+ train/ActionL1Loss=0.0754
+ throughput/total_tokens=364,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1898/500000]
+ train/ActionL1Loss=0.0778
+ throughput/total_tokens=364,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1899/500000]
+ train/ActionL1Loss=0.0903
+ throughput/total_tokens=364,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1900/500000]
+ optim/total_grad_norm=11.07
+ train/ActionL1Loss=0.0792
+ throughput/total_tokens=364,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1901/500000]
+ train/ActionL1Loss=0.1023
+ throughput/total_tokens=364,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1902/500000]
+ train/ActionL1Loss=0.0838
+ throughput/total_tokens=365,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1903/500000]
+ train/ActionL1Loss=0.0661
+ throughput/total_tokens=365,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1904/500000]
+ train/ActionL1Loss=0.0778
+ throughput/total_tokens=365,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1905/500000]
+ train/ActionL1Loss=0.0753
+ throughput/total_tokens=365,760,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1906/500000]
+ train/ActionL1Loss=0.0768
+ throughput/total_tokens=365,952,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1907/500000]
+ train/ActionL1Loss=0.0714
+ throughput/total_tokens=366,144,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1908/500000]
+ train/ActionL1Loss=0.0691
+ throughput/total_tokens=366,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1909/500000]
+ train/ActionL1Loss=0.0798
+ throughput/total_tokens=366,528,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1910/500000]
+ train/ActionL1Loss=0.0870
+ throughput/total_tokens=366,720,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=1911/500000]
+ train/ActionL1Loss=0.0742
+ throughput/total_tokens=366,912,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1912/500000]
+ train/ActionL1Loss=0.0584
+ throughput/total_tokens=367,104,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1913/500000]
+ train/ActionL1Loss=0.0800
+ throughput/total_tokens=367,296,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1914/500000]
+ train/ActionL1Loss=0.0920
+ throughput/total_tokens=367,488,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1915/500000]
+ train/ActionL1Loss=0.0843
+ throughput/total_tokens=367,680,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1916/500000]
+ train/ActionL1Loss=0.0832
+ throughput/total_tokens=367,872,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1917/500000]
+ train/ActionL1Loss=0.0888
+ throughput/total_tokens=368,064,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1918/500000]
+ train/ActionL1Loss=0.0832
+ throughput/total_tokens=368,256,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1919/500000]
+ train/ActionL1Loss=0.0755
+ throughput/total_tokens=368,448,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=1920/500000]
+ optim/total_grad_norm=7.356
+ train/ActionL1Loss=0.0820
+ throughput/total_tokens=368,640,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1921/500000]
+ train/ActionL1Loss=0.0760
+ throughput/total_tokens=368,832,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1922/500000]
+ train/ActionL1Loss=0.0932
+ throughput/total_tokens=369,024,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1923/500000]
+ train/ActionL1Loss=0.0824
+ throughput/total_tokens=369,216,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1924/500000]
+ train/ActionL1Loss=0.0875
+ throughput/total_tokens=369,408,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1925/500000]
+ train/ActionL1Loss=0.0782
+ throughput/total_tokens=369,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1926/500000]
+ train/ActionL1Loss=0.0702
+ throughput/total_tokens=369,792,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1927/500000]
+ train/ActionL1Loss=0.1108
+ throughput/total_tokens=369,984,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1928/500000]
+ train/ActionL1Loss=0.0876
+ throughput/total_tokens=370,176,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1929/500000]
+ train/ActionL1Loss=0.0945
+ throughput/total_tokens=370,368,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1930/500000]
+ train/ActionL1Loss=0.0840
+ throughput/total_tokens=370,560,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1931/500000]
+ train/ActionL1Loss=0.0797
+ throughput/total_tokens=370,752,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1932/500000]
+ train/ActionL1Loss=0.0953
+ throughput/total_tokens=370,944,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1933/500000]
+ train/ActionL1Loss=0.0932
+ throughput/total_tokens=371,136,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1934/500000]
+ train/ActionL1Loss=0.0917
+ throughput/total_tokens=371,328,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1935/500000]
+ train/ActionL1Loss=0.0794
+ throughput/total_tokens=371,520,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1936/500000]
+ train/ActionL1Loss=0.0700
+ throughput/total_tokens=371,712,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1937/500000]
+ train/ActionL1Loss=0.1100
+ throughput/total_tokens=371,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1938/500000]
+ train/ActionL1Loss=0.0779
+ throughput/total_tokens=372,096,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1939/500000]
+ train/ActionL1Loss=0.1070
+ throughput/total_tokens=372,288,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=1940/500000]
+ optim/total_grad_norm=8.476
+ train/ActionL1Loss=0.0972
+ throughput/total_tokens=372,480,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1941/500000]
+ train/ActionL1Loss=0.0852
+ throughput/total_tokens=372,672,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1942/500000]
+ train/ActionL1Loss=0.0910
+ throughput/total_tokens=372,864,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=1943/500000]
+ train/ActionL1Loss=0.0935
+ throughput/total_tokens=373,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1944/500000]
+ train/ActionL1Loss=0.0876
+ throughput/total_tokens=373,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1945/500000]
+ train/ActionL1Loss=0.0877
+ throughput/total_tokens=373,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1946/500000]
+ train/ActionL1Loss=0.0885
+ throughput/total_tokens=373,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1947/500000]
+ train/ActionL1Loss=0.0888
+ throughput/total_tokens=373,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1948/500000]
+ train/ActionL1Loss=0.0889
+ throughput/total_tokens=374,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1949/500000]
+ train/ActionL1Loss=0.0822
+ throughput/total_tokens=374,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1950/500000]
+ train/ActionL1Loss=0.0780
+ throughput/total_tokens=374,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1951/500000]
+ train/ActionL1Loss=0.0782
+ throughput/total_tokens=374,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1952/500000]
+ train/ActionL1Loss=0.0917
+ throughput/total_tokens=374,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1953/500000]
+ train/ActionL1Loss=0.1246
+ throughput/total_tokens=374,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1954/500000]
+ train/ActionL1Loss=0.0927
+ throughput/total_tokens=375,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1955/500000]
+ train/ActionL1Loss=0.0954
+ throughput/total_tokens=375,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1956/500000]
+ train/ActionL1Loss=0.0962
+ throughput/total_tokens=375,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1957/500000]
+ train/ActionL1Loss=0.0943
+ throughput/total_tokens=375,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=1958/500000]
+ train/ActionL1Loss=0.0997
+ throughput/total_tokens=375,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1959/500000]
+ train/ActionL1Loss=0.0762
+ throughput/total_tokens=376,128,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1960/500000]
+ optim/total_grad_norm=7.918
+ train/ActionL1Loss=0.0843
+ throughput/total_tokens=376,320,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=1961/500000]
+ train/ActionL1Loss=0.0985
+ throughput/total_tokens=376,512,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1962/500000]
+ train/ActionL1Loss=0.1145
+ throughput/total_tokens=376,704,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1963/500000]
+ train/ActionL1Loss=0.1007
+ throughput/total_tokens=376,896,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1964/500000]
+ train/ActionL1Loss=0.0884
+ throughput/total_tokens=377,088,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=1965/500000]
+ train/ActionL1Loss=0.1097
+ throughput/total_tokens=377,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1966/500000]
+ train/ActionL1Loss=0.0790
+ throughput/total_tokens=377,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1967/500000]
+ train/ActionL1Loss=0.1045
+ throughput/total_tokens=377,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1968/500000]
+ train/ActionL1Loss=0.1001
+ throughput/total_tokens=377,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1969/500000]
+ train/ActionL1Loss=0.0878
+ throughput/total_tokens=378,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=1970/500000]
+ train/ActionL1Loss=0.0931
+ throughput/total_tokens=378,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1971/500000]
+ train/ActionL1Loss=0.1036
+ throughput/total_tokens=378,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1972/500000]
+ train/ActionL1Loss=0.0803
+ throughput/total_tokens=378,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1973/500000]
+ train/ActionL1Loss=0.1155
+ throughput/total_tokens=378,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1974/500000]
+ train/ActionL1Loss=0.0995
+ throughput/total_tokens=379,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1975/500000]
+ train/ActionL1Loss=0.1041
+ throughput/total_tokens=379,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1976/500000]
+ train/ActionL1Loss=0.0980
+ throughput/total_tokens=379,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1977/500000]
+ train/ActionL1Loss=0.1330
+ throughput/total_tokens=379,584,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1978/500000]
+ train/ActionL1Loss=0.0937
+ throughput/total_tokens=379,776,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1979/500000]
+ train/ActionL1Loss=0.0872
+ throughput/total_tokens=379,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1980/500000]
+ optim/total_grad_norm=8.853
+ train/ActionL1Loss=0.0797
+ throughput/total_tokens=380,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1981/500000]
+ train/ActionL1Loss=0.0860
+ throughput/total_tokens=380,352,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1982/500000]
+ train/ActionL1Loss=0.0685
+ throughput/total_tokens=380,544,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1983/500000]
+ train/ActionL1Loss=0.1069
+ throughput/total_tokens=380,736,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1984/500000]
+ train/ActionL1Loss=0.0830
+ throughput/total_tokens=380,928,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=1985/500000]
+ train/ActionL1Loss=0.0849
+ throughput/total_tokens=381,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1986/500000]
+ train/ActionL1Loss=0.0844
+ throughput/total_tokens=381,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1987/500000]
+ train/ActionL1Loss=0.0903
+ throughput/total_tokens=381,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1988/500000]
+ train/ActionL1Loss=0.0811
+ throughput/total_tokens=381,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1989/500000]
+ train/ActionL1Loss=0.0862
+ throughput/total_tokens=381,888,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1990/500000]
+ train/ActionL1Loss=0.1061
+ throughput/total_tokens=382,080,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=1991/500000]
+ train/ActionL1Loss=0.0742
+ throughput/total_tokens=382,272,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1992/500000]
+ train/ActionL1Loss=0.0774
+ throughput/total_tokens=382,464,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1993/500000]
+ train/ActionL1Loss=0.0821
+ throughput/total_tokens=382,656,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=1994/500000]
+ train/ActionL1Loss=0.0821
+ throughput/total_tokens=382,848,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1995/500000]
+ train/ActionL1Loss=0.0863
+ throughput/total_tokens=383,040,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1996/500000]
+ train/ActionL1Loss=0.0757
+ throughput/total_tokens=383,232,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1997/500000]
+ train/ActionL1Loss=0.0895
+ throughput/total_tokens=383,424,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=1998/500000]
+ train/ActionL1Loss=0.1009
+ throughput/total_tokens=383,616,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=1999/500000]
+ train/ActionL1Loss=0.0776
+ throughput/total_tokens=383,808,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=2000/500000]
+ optim/total_grad_norm=9.144
+ train/ActionL1Loss=0.0683
+ throughput/total_tokens=384,000,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+10/03 [04:09:30] INFO | >> Saving config... checkpoint.py:608
+10/03 [04:10:30] INFO | >> Saving model state... checkpoint.py:796
+10/03 [04:11:41] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [04:13:10] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=2001/500000]
+ train/ActionL1Loss=0.0826
+ throughput/total_tokens=384,192,000
+ throughput/device/tokens_per_second=1,223
+ throughput/device/batches_per_second=0.0510
+[step=2002/500000]
+ train/ActionL1Loss=0.0688
+ throughput/total_tokens=384,384,000
+ throughput/device/tokens_per_second=1,203
+ throughput/device/batches_per_second=0.0502
+[step=2003/500000]
+ train/ActionL1Loss=0.0687
+ throughput/total_tokens=384,576,000
+ throughput/device/tokens_per_second=1,194
+ throughput/device/batches_per_second=0.0498
+[step=2004/500000]
+ train/ActionL1Loss=0.0748
+ throughput/total_tokens=384,768,000
+ throughput/device/tokens_per_second=1,191
+ throughput/device/batches_per_second=0.0496
+[step=2005/500000]
+ train/ActionL1Loss=0.0701
+ throughput/total_tokens=384,960,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=2006/500000]
+ train/ActionL1Loss=0.0870
+ throughput/total_tokens=385,152,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=2007/500000]
+ train/ActionL1Loss=0.0611
+ throughput/total_tokens=385,344,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=2008/500000]
+ train/ActionL1Loss=0.0833
+ throughput/total_tokens=385,536,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=2009/500000]
+ train/ActionL1Loss=0.0711
+ throughput/total_tokens=385,728,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2010/500000]
+ train/ActionL1Loss=0.0870
+ throughput/total_tokens=385,920,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2011/500000]
+ train/ActionL1Loss=0.0780
+ throughput/total_tokens=386,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2012/500000]
+ train/ActionL1Loss=0.0808
+ throughput/total_tokens=386,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2013/500000]
+ train/ActionL1Loss=0.0624
+ throughput/total_tokens=386,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2014/500000]
+ train/ActionL1Loss=0.0790
+ throughput/total_tokens=386,688,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2015/500000]
+ train/ActionL1Loss=0.0734
+ throughput/total_tokens=386,880,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2016/500000]
+ train/ActionL1Loss=0.0869
+ throughput/total_tokens=387,072,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2017/500000]
+ train/ActionL1Loss=0.0628
+ throughput/total_tokens=387,264,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2018/500000]
+ train/ActionL1Loss=0.0904
+ throughput/total_tokens=387,456,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2019/500000]
+ train/ActionL1Loss=0.0768
+ throughput/total_tokens=387,648,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2020/500000]
+ optim/total_grad_norm=10.56
+ train/ActionL1Loss=0.0712
+ throughput/total_tokens=387,840,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2021/500000]
+ train/ActionL1Loss=0.0748
+ throughput/total_tokens=388,032,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2022/500000]
+ train/ActionL1Loss=0.0898
+ throughput/total_tokens=388,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2023/500000]
+ train/ActionL1Loss=0.0809
+ throughput/total_tokens=388,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2024/500000]
+ train/ActionL1Loss=0.0939
+ throughput/total_tokens=388,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2025/500000]
+ train/ActionL1Loss=0.0727
+ throughput/total_tokens=388,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2026/500000]
+ train/ActionL1Loss=0.1031
+ throughput/total_tokens=388,992,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2027/500000]
+ train/ActionL1Loss=0.0915
+ throughput/total_tokens=389,184,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2028/500000]
+ train/ActionL1Loss=0.0780
+ throughput/total_tokens=389,376,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2029/500000]
+ train/ActionL1Loss=0.1342
+ throughput/total_tokens=389,568,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2030/500000]
+ train/ActionL1Loss=0.0646
+ throughput/total_tokens=389,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2031/500000]
+ train/ActionL1Loss=0.0671
+ throughput/total_tokens=389,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2032/500000]
+ train/ActionL1Loss=0.0723
+ throughput/total_tokens=390,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2033/500000]
+ train/ActionL1Loss=0.0761
+ throughput/total_tokens=390,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2034/500000]
+ train/ActionL1Loss=0.0729
+ throughput/total_tokens=390,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2035/500000]
+ train/ActionL1Loss=0.0949
+ throughput/total_tokens=390,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2036/500000]
+ train/ActionL1Loss=0.0732
+ throughput/total_tokens=390,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2037/500000]
+ train/ActionL1Loss=0.0817
+ throughput/total_tokens=391,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2038/500000]
+ train/ActionL1Loss=0.0952
+ throughput/total_tokens=391,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2039/500000]
+ train/ActionL1Loss=0.0773
+ throughput/total_tokens=391,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2040/500000]
+ optim/total_grad_norm=10.20
+ train/ActionL1Loss=0.1016
+ throughput/total_tokens=391,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2041/500000]
+ train/ActionL1Loss=0.0702
+ throughput/total_tokens=391,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2042/500000]
+ train/ActionL1Loss=0.1288
+ throughput/total_tokens=392,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2043/500000]
+ train/ActionL1Loss=0.0888
+ throughput/total_tokens=392,256,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2044/500000]
+ train/ActionL1Loss=0.0801
+ throughput/total_tokens=392,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2045/500000]
+ train/ActionL1Loss=0.0786
+ throughput/total_tokens=392,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2046/500000]
+ train/ActionL1Loss=0.0853
+ throughput/total_tokens=392,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2047/500000]
+ train/ActionL1Loss=0.0833
+ throughput/total_tokens=393,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2048/500000]
+ train/ActionL1Loss=0.0970
+ throughput/total_tokens=393,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2049/500000]
+ train/ActionL1Loss=0.0945
+ throughput/total_tokens=393,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2050/500000]
+ train/ActionL1Loss=0.0810
+ throughput/total_tokens=393,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2051/500000]
+ train/ActionL1Loss=0.0671
+ throughput/total_tokens=393,792,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2052/500000]
+ train/ActionL1Loss=0.0911
+ throughput/total_tokens=393,984,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2053/500000]
+ train/ActionL1Loss=0.0757
+ throughput/total_tokens=394,176,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2054/500000]
+ train/ActionL1Loss=0.0771
+ throughput/total_tokens=394,368,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2055/500000]
+ train/ActionL1Loss=0.0821
+ throughput/total_tokens=394,560,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2056/500000]
+ train/ActionL1Loss=0.0876
+ throughput/total_tokens=394,752,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2057/500000]
+ train/ActionL1Loss=0.0947
+ throughput/total_tokens=394,944,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2058/500000]
+ train/ActionL1Loss=0.0940
+ throughput/total_tokens=395,136,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2059/500000]
+ train/ActionL1Loss=0.0967
+ throughput/total_tokens=395,328,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2060/500000]
+ optim/total_grad_norm=10.00
+ train/ActionL1Loss=0.0827
+ throughput/total_tokens=395,520,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=2061/500000]
+ train/ActionL1Loss=0.0862
+ throughput/total_tokens=395,712,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2062/500000]
+ train/ActionL1Loss=0.0934
+ throughput/total_tokens=395,904,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2063/500000]
+ train/ActionL1Loss=0.0777
+ throughput/total_tokens=396,096,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2064/500000]
+ train/ActionL1Loss=0.0687
+ throughput/total_tokens=396,288,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2065/500000]
+ train/ActionL1Loss=0.0742
+ throughput/total_tokens=396,480,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2066/500000]
+ train/ActionL1Loss=0.0930
+ throughput/total_tokens=396,672,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2067/500000]
+ train/ActionL1Loss=0.0820
+ throughput/total_tokens=396,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2068/500000]
+ train/ActionL1Loss=0.0788
+ throughput/total_tokens=397,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2069/500000]
+ train/ActionL1Loss=0.0922
+ throughput/total_tokens=397,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2070/500000]
+ train/ActionL1Loss=0.0732
+ throughput/total_tokens=397,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2071/500000]
+ train/ActionL1Loss=0.0845
+ throughput/total_tokens=397,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2072/500000]
+ train/ActionL1Loss=0.0912
+ throughput/total_tokens=397,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2073/500000]
+ train/ActionL1Loss=0.0755
+ throughput/total_tokens=398,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2074/500000]
+ train/ActionL1Loss=0.0749
+ throughput/total_tokens=398,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2075/500000]
+ train/ActionL1Loss=0.0660
+ throughput/total_tokens=398,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2076/500000]
+ train/ActionL1Loss=0.0733
+ throughput/total_tokens=398,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2077/500000]
+ train/ActionL1Loss=0.0867
+ throughput/total_tokens=398,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2078/500000]
+ train/ActionL1Loss=0.0659
+ throughput/total_tokens=398,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2079/500000]
+ train/ActionL1Loss=0.0765
+ throughput/total_tokens=399,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2080/500000]
+ optim/total_grad_norm=8.299
+ train/ActionL1Loss=0.0910
+ throughput/total_tokens=399,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2081/500000]
+ train/ActionL1Loss=0.0698
+ throughput/total_tokens=399,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2082/500000]
+ train/ActionL1Loss=0.0702
+ throughput/total_tokens=399,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2083/500000]
+ train/ActionL1Loss=0.0711
+ throughput/total_tokens=399,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2084/500000]
+ train/ActionL1Loss=0.0726
+ throughput/total_tokens=400,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2085/500000]
+ train/ActionL1Loss=0.0687
+ throughput/total_tokens=400,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2086/500000]
+ train/ActionL1Loss=0.0688
+ throughput/total_tokens=400,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2087/500000]
+ train/ActionL1Loss=0.0859
+ throughput/total_tokens=400,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2088/500000]
+ train/ActionL1Loss=0.0671
+ throughput/total_tokens=400,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2089/500000]
+ train/ActionL1Loss=0.0814
+ throughput/total_tokens=401,088,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2090/500000]
+ train/ActionL1Loss=0.0682
+ throughput/total_tokens=401,280,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2091/500000]
+ train/ActionL1Loss=0.0785
+ throughput/total_tokens=401,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2092/500000]
+ train/ActionL1Loss=0.0736
+ throughput/total_tokens=401,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2093/500000]
+ train/ActionL1Loss=0.0811
+ throughput/total_tokens=401,856,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2094/500000]
+ train/ActionL1Loss=0.0627
+ throughput/total_tokens=402,048,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2095/500000]
+ train/ActionL1Loss=0.0648
+ throughput/total_tokens=402,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2096/500000]
+ train/ActionL1Loss=0.0664
+ throughput/total_tokens=402,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2097/500000]
+ train/ActionL1Loss=0.0707
+ throughput/total_tokens=402,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2098/500000]
+ train/ActionL1Loss=0.0788
+ throughput/total_tokens=402,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2099/500000]
+ train/ActionL1Loss=0.0753
+ throughput/total_tokens=403,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2100/500000]
+ optim/total_grad_norm=8.204
+ train/ActionL1Loss=0.0725
+ throughput/total_tokens=403,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2101/500000]
+ train/ActionL1Loss=0.0737
+ throughput/total_tokens=403,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2102/500000]
+ train/ActionL1Loss=0.0733
+ throughput/total_tokens=403,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2103/500000]
+ train/ActionL1Loss=0.0881
+ throughput/total_tokens=403,776,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2104/500000]
+ train/ActionL1Loss=0.0659
+ throughput/total_tokens=403,968,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2105/500000]
+ train/ActionL1Loss=0.0653
+ throughput/total_tokens=404,160,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2106/500000]
+ train/ActionL1Loss=0.0770
+ throughput/total_tokens=404,352,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2107/500000]
+ train/ActionL1Loss=0.0713
+ throughput/total_tokens=404,544,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2108/500000]
+ train/ActionL1Loss=0.0758
+ throughput/total_tokens=404,736,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2109/500000]
+ train/ActionL1Loss=0.0882
+ throughput/total_tokens=404,928,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2110/500000]
+ train/ActionL1Loss=0.0827
+ throughput/total_tokens=405,120,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2111/500000]
+ train/ActionL1Loss=0.0867
+ throughput/total_tokens=405,312,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2112/500000]
+ train/ActionL1Loss=0.0906
+ throughput/total_tokens=405,504,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2113/500000]
+ train/ActionL1Loss=0.0763
+ throughput/total_tokens=405,696,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2114/500000]
+ train/ActionL1Loss=0.1145
+ throughput/total_tokens=405,888,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2115/500000]
+ train/ActionL1Loss=0.0935
+ throughput/total_tokens=406,080,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2116/500000]
+ train/ActionL1Loss=0.1007
+ throughput/total_tokens=406,272,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2117/500000]
+ train/ActionL1Loss=0.0844
+ throughput/total_tokens=406,464,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2118/500000]
+ train/ActionL1Loss=0.0816
+ throughput/total_tokens=406,656,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2119/500000]
+ train/ActionL1Loss=0.1241
+ throughput/total_tokens=406,848,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2120/500000]
+ optim/total_grad_norm=9.198
+ train/ActionL1Loss=0.0905
+ throughput/total_tokens=407,040,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2121/500000]
+ train/ActionL1Loss=0.0988
+ throughput/total_tokens=407,232,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=2122/500000]
+ train/ActionL1Loss=0.0923
+ throughput/total_tokens=407,424,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=2123/500000]
+ train/ActionL1Loss=0.0990
+ throughput/total_tokens=407,616,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=2124/500000]
+ train/ActionL1Loss=0.1122
+ throughput/total_tokens=407,808,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=2125/500000]
+ train/ActionL1Loss=0.0875
+ throughput/total_tokens=408,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2126/500000]
+ train/ActionL1Loss=0.1042
+ throughput/total_tokens=408,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2127/500000]
+ train/ActionL1Loss=0.0995
+ throughput/total_tokens=408,384,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2128/500000]
+ train/ActionL1Loss=0.0887
+ throughput/total_tokens=408,576,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2129/500000]
+ train/ActionL1Loss=0.0841
+ throughput/total_tokens=408,768,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2130/500000]
+ train/ActionL1Loss=0.0825
+ throughput/total_tokens=408,960,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2131/500000]
+ train/ActionL1Loss=0.0695
+ throughput/total_tokens=409,152,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2132/500000]
+ train/ActionL1Loss=0.0759
+ throughput/total_tokens=409,344,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2133/500000]
+ train/ActionL1Loss=0.0790
+ throughput/total_tokens=409,536,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2134/500000]
+ train/ActionL1Loss=0.0765
+ throughput/total_tokens=409,728,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2135/500000]
+ train/ActionL1Loss=0.0670
+ throughput/total_tokens=409,920,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2136/500000]
+ train/ActionL1Loss=0.0876
+ throughput/total_tokens=410,112,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2137/500000]
+ train/ActionL1Loss=0.0824
+ throughput/total_tokens=410,304,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2138/500000]
+ train/ActionL1Loss=0.0727
+ throughput/total_tokens=410,496,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2139/500000]
+ train/ActionL1Loss=0.0994
+ throughput/total_tokens=410,688,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2140/500000]
+ optim/total_grad_norm=8.154
+ train/ActionL1Loss=0.0963
+ throughput/total_tokens=410,880,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2141/500000]
+ train/ActionL1Loss=0.0818
+ throughput/total_tokens=411,072,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2142/500000]
+ train/ActionL1Loss=0.0884
+ throughput/total_tokens=411,264,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2143/500000]
+ train/ActionL1Loss=0.0856
+ throughput/total_tokens=411,456,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2144/500000]
+ train/ActionL1Loss=0.0792
+ throughput/total_tokens=411,648,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2145/500000]
+ train/ActionL1Loss=0.0833
+ throughput/total_tokens=411,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2146/500000]
+ train/ActionL1Loss=0.0737
+ throughput/total_tokens=412,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2147/500000]
+ train/ActionL1Loss=0.0624
+ throughput/total_tokens=412,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2148/500000]
+ train/ActionL1Loss=0.0764
+ throughput/total_tokens=412,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2149/500000]
+ train/ActionL1Loss=0.0685
+ throughput/total_tokens=412,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2150/500000]
+ train/ActionL1Loss=0.0667
+ throughput/total_tokens=412,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2151/500000]
+ train/ActionL1Loss=0.0675
+ throughput/total_tokens=412,992,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2152/500000]
+ train/ActionL1Loss=0.0637
+ throughput/total_tokens=413,184,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2153/500000]
+ train/ActionL1Loss=0.0600
+ throughput/total_tokens=413,376,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2154/500000]
+ train/ActionL1Loss=0.0652
+ throughput/total_tokens=413,568,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2155/500000]
+ train/ActionL1Loss=0.0755
+ throughput/total_tokens=413,760,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2156/500000]
+ train/ActionL1Loss=0.0599
+ throughput/total_tokens=413,952,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2157/500000]
+ train/ActionL1Loss=0.0762
+ throughput/total_tokens=414,144,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2158/500000]
+ train/ActionL1Loss=0.0706
+ throughput/total_tokens=414,336,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2159/500000]
+ train/ActionL1Loss=0.0787
+ throughput/total_tokens=414,528,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2160/500000]
+ optim/total_grad_norm=9.539
+ train/ActionL1Loss=0.0721
+ throughput/total_tokens=414,720,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2161/500000]
+ train/ActionL1Loss=0.0921
+ throughput/total_tokens=414,912,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2162/500000]
+ train/ActionL1Loss=0.0804
+ throughput/total_tokens=415,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2163/500000]
+ train/ActionL1Loss=0.0856
+ throughput/total_tokens=415,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2164/500000]
+ train/ActionL1Loss=0.0750
+ throughput/total_tokens=415,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2165/500000]
+ train/ActionL1Loss=0.0768
+ throughput/total_tokens=415,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2166/500000]
+ train/ActionL1Loss=0.0714
+ throughput/total_tokens=415,872,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2167/500000]
+ train/ActionL1Loss=0.0679
+ throughput/total_tokens=416,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2168/500000]
+ train/ActionL1Loss=0.0775
+ throughput/total_tokens=416,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2169/500000]
+ train/ActionL1Loss=0.0723
+ throughput/total_tokens=416,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2170/500000]
+ train/ActionL1Loss=0.0818
+ throughput/total_tokens=416,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2171/500000]
+ train/ActionL1Loss=0.0620
+ throughput/total_tokens=416,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2172/500000]
+ train/ActionL1Loss=0.0700
+ throughput/total_tokens=417,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2173/500000]
+ train/ActionL1Loss=0.0731
+ throughput/total_tokens=417,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2174/500000]
+ train/ActionL1Loss=0.0891
+ throughput/total_tokens=417,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2175/500000]
+ train/ActionL1Loss=0.0667
+ throughput/total_tokens=417,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2176/500000]
+ train/ActionL1Loss=0.0718
+ throughput/total_tokens=417,792,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2177/500000]
+ train/ActionL1Loss=0.0770
+ throughput/total_tokens=417,984,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2178/500000]
+ train/ActionL1Loss=0.0866
+ throughput/total_tokens=418,176,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2179/500000]
+ train/ActionL1Loss=0.0776
+ throughput/total_tokens=418,368,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2180/500000]
+ optim/total_grad_norm=8.938
+ train/ActionL1Loss=0.0795
+ throughput/total_tokens=418,560,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2181/500000]
+ train/ActionL1Loss=0.0929
+ throughput/total_tokens=418,752,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2182/500000]
+ train/ActionL1Loss=0.0797
+ throughput/total_tokens=418,944,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2183/500000]
+ train/ActionL1Loss=0.0829
+ throughput/total_tokens=419,136,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2184/500000]
+ train/ActionL1Loss=0.0830
+ throughput/total_tokens=419,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2185/500000]
+ train/ActionL1Loss=0.0654
+ throughput/total_tokens=419,520,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2186/500000]
+ train/ActionL1Loss=0.0722
+ throughput/total_tokens=419,712,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2187/500000]
+ train/ActionL1Loss=0.0904
+ throughput/total_tokens=419,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2188/500000]
+ train/ActionL1Loss=0.0771
+ throughput/total_tokens=420,096,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2189/500000]
+ train/ActionL1Loss=0.0774
+ throughput/total_tokens=420,288,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2190/500000]
+ train/ActionL1Loss=0.0975
+ throughput/total_tokens=420,480,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2191/500000]
+ train/ActionL1Loss=0.0764
+ throughput/total_tokens=420,672,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2192/500000]
+ train/ActionL1Loss=0.0897
+ throughput/total_tokens=420,864,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2193/500000]
+ train/ActionL1Loss=0.0853
+ throughput/total_tokens=421,056,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2194/500000]
+ train/ActionL1Loss=0.1328
+ throughput/total_tokens=421,248,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2195/500000]
+ train/ActionL1Loss=0.0791
+ throughput/total_tokens=421,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2196/500000]
+ train/ActionL1Loss=0.0877
+ throughput/total_tokens=421,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2197/500000]
+ train/ActionL1Loss=0.0847
+ throughput/total_tokens=421,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2198/500000]
+ train/ActionL1Loss=0.0783
+ throughput/total_tokens=422,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2199/500000]
+ train/ActionL1Loss=0.0920
+ throughput/total_tokens=422,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2200/500000]
+ optim/total_grad_norm=9.934
+ train/ActionL1Loss=0.0904
+ throughput/total_tokens=422,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2201/500000]
+ train/ActionL1Loss=0.0724
+ throughput/total_tokens=422,592,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2202/500000]
+ train/ActionL1Loss=0.0733
+ throughput/total_tokens=422,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2203/500000]
+ train/ActionL1Loss=0.0966
+ throughput/total_tokens=422,976,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2204/500000]
+ train/ActionL1Loss=0.0718
+ throughput/total_tokens=423,168,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2205/500000]
+ train/ActionL1Loss=0.0922
+ throughput/total_tokens=423,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2206/500000]
+ train/ActionL1Loss=0.0745
+ throughput/total_tokens=423,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2207/500000]
+ train/ActionL1Loss=0.0639
+ throughput/total_tokens=423,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2208/500000]
+ train/ActionL1Loss=0.0798
+ throughput/total_tokens=423,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2209/500000]
+ train/ActionL1Loss=0.0772
+ throughput/total_tokens=424,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2210/500000]
+ train/ActionL1Loss=0.0701
+ throughput/total_tokens=424,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2211/500000]
+ train/ActionL1Loss=0.0798
+ throughput/total_tokens=424,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2212/500000]
+ train/ActionL1Loss=0.0793
+ throughput/total_tokens=424,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2213/500000]
+ train/ActionL1Loss=0.0894
+ throughput/total_tokens=424,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2214/500000]
+ train/ActionL1Loss=0.0881
+ throughput/total_tokens=425,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2215/500000]
+ train/ActionL1Loss=0.0685
+ throughput/total_tokens=425,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2216/500000]
+ train/ActionL1Loss=0.0744
+ throughput/total_tokens=425,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2217/500000]
+ train/ActionL1Loss=0.0700
+ throughput/total_tokens=425,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2218/500000]
+ train/ActionL1Loss=0.0659
+ throughput/total_tokens=425,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2219/500000]
+ train/ActionL1Loss=0.0770
+ throughput/total_tokens=426,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2220/500000]
+ optim/total_grad_norm=9.069
+ train/ActionL1Loss=0.0779
+ throughput/total_tokens=426,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2221/500000]
+ train/ActionL1Loss=0.0746
+ throughput/total_tokens=426,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2222/500000]
+ train/ActionL1Loss=0.0873
+ throughput/total_tokens=426,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2223/500000]
+ train/ActionL1Loss=0.0792
+ throughput/total_tokens=426,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2224/500000]
+ train/ActionL1Loss=0.0868
+ throughput/total_tokens=427,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2225/500000]
+ train/ActionL1Loss=0.0744
+ throughput/total_tokens=427,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2226/500000]
+ train/ActionL1Loss=0.0774
+ throughput/total_tokens=427,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2227/500000]
+ train/ActionL1Loss=0.0629
+ throughput/total_tokens=427,584,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2228/500000]
+ train/ActionL1Loss=0.0834
+ throughput/total_tokens=427,776,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2229/500000]
+ train/ActionL1Loss=0.0813
+ throughput/total_tokens=427,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2230/500000]
+ train/ActionL1Loss=0.0618
+ throughput/total_tokens=428,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2231/500000]
+ train/ActionL1Loss=0.0754
+ throughput/total_tokens=428,352,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2232/500000]
+ train/ActionL1Loss=0.0688
+ throughput/total_tokens=428,544,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2233/500000]
+ train/ActionL1Loss=0.0615
+ throughput/total_tokens=428,736,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2234/500000]
+ train/ActionL1Loss=0.0638
+ throughput/total_tokens=428,928,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2235/500000]
+ train/ActionL1Loss=0.0634
+ throughput/total_tokens=429,120,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2236/500000]
+ train/ActionL1Loss=0.0795
+ throughput/total_tokens=429,312,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2237/500000]
+ train/ActionL1Loss=0.0808
+ throughput/total_tokens=429,504,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2238/500000]
+ train/ActionL1Loss=0.0727
+ throughput/total_tokens=429,696,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2239/500000]
+ train/ActionL1Loss=0.0756
+ throughput/total_tokens=429,888,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2240/500000]
+ optim/total_grad_norm=10.12
+ train/ActionL1Loss=0.0822
+ throughput/total_tokens=430,080,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2241/500000]
+ train/ActionL1Loss=0.0757
+ throughput/total_tokens=430,272,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2242/500000]
+ train/ActionL1Loss=0.0769
+ throughput/total_tokens=430,464,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2243/500000]
+ train/ActionL1Loss=0.0752
+ throughput/total_tokens=430,656,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2244/500000]
+ train/ActionL1Loss=0.0701
+ throughput/total_tokens=430,848,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2245/500000]
+ train/ActionL1Loss=0.0657
+ throughput/total_tokens=431,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2246/500000]
+ train/ActionL1Loss=0.0705
+ throughput/total_tokens=431,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2247/500000]
+ train/ActionL1Loss=0.0879
+ throughput/total_tokens=431,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2248/500000]
+ train/ActionL1Loss=0.0760
+ throughput/total_tokens=431,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2249/500000]
+ train/ActionL1Loss=0.0822
+ throughput/total_tokens=431,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2250/500000]
+ train/ActionL1Loss=0.0717
+ throughput/total_tokens=432,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2251/500000]
+ train/ActionL1Loss=0.0834
+ throughput/total_tokens=432,192,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2252/500000]
+ train/ActionL1Loss=0.0880
+ throughput/total_tokens=432,384,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2253/500000]
+ train/ActionL1Loss=0.0800
+ throughput/total_tokens=432,576,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2254/500000]
+ train/ActionL1Loss=0.0812
+ throughput/total_tokens=432,768,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2255/500000]
+ train/ActionL1Loss=0.0734
+ throughput/total_tokens=432,960,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2256/500000]
+ train/ActionL1Loss=0.0983
+ throughput/total_tokens=433,152,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2257/500000]
+ train/ActionL1Loss=0.0864
+ throughput/total_tokens=433,344,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2258/500000]
+ train/ActionL1Loss=0.0766
+ throughput/total_tokens=433,536,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2259/500000]
+ train/ActionL1Loss=0.0798
+ throughput/total_tokens=433,728,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2260/500000]
+ optim/total_grad_norm=7.544
+ train/ActionL1Loss=0.0769
+ throughput/total_tokens=433,920,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2261/500000]
+ train/ActionL1Loss=0.0862
+ throughput/total_tokens=434,112,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2262/500000]
+ train/ActionL1Loss=0.0946
+ throughput/total_tokens=434,304,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2263/500000]
+ train/ActionL1Loss=0.0736
+ throughput/total_tokens=434,496,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2264/500000]
+ train/ActionL1Loss=0.0901
+ throughput/total_tokens=434,688,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2265/500000]
+ train/ActionL1Loss=0.0860
+ throughput/total_tokens=434,880,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2266/500000]
+ train/ActionL1Loss=0.0816
+ throughput/total_tokens=435,072,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2267/500000]
+ train/ActionL1Loss=0.1059
+ throughput/total_tokens=435,264,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2268/500000]
+ train/ActionL1Loss=0.0708
+ throughput/total_tokens=435,456,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2269/500000]
+ train/ActionL1Loss=0.0659
+ throughput/total_tokens=435,648,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2270/500000]
+ train/ActionL1Loss=0.0781
+ throughput/total_tokens=435,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2271/500000]
+ train/ActionL1Loss=0.0877
+ throughput/total_tokens=436,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2272/500000]
+ train/ActionL1Loss=0.0646
+ throughput/total_tokens=436,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2273/500000]
+ train/ActionL1Loss=0.0549
+ throughput/total_tokens=436,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2274/500000]
+ train/ActionL1Loss=0.0811
+ throughput/total_tokens=436,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2275/500000]
+ train/ActionL1Loss=0.0858
+ throughput/total_tokens=436,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2276/500000]
+ train/ActionL1Loss=0.0823
+ throughput/total_tokens=436,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2277/500000]
+ train/ActionL1Loss=0.0859
+ throughput/total_tokens=437,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2278/500000]
+ train/ActionL1Loss=0.0665
+ throughput/total_tokens=437,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2279/500000]
+ train/ActionL1Loss=0.0667
+ throughput/total_tokens=437,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2280/500000]
+ optim/total_grad_norm=8.745
+ train/ActionL1Loss=0.0632
+ throughput/total_tokens=437,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2281/500000]
+ train/ActionL1Loss=0.0833
+ throughput/total_tokens=437,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2282/500000]
+ train/ActionL1Loss=0.0890
+ throughput/total_tokens=438,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2283/500000]
+ train/ActionL1Loss=0.0789
+ throughput/total_tokens=438,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2284/500000]
+ train/ActionL1Loss=0.0687
+ throughput/total_tokens=438,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2285/500000]
+ train/ActionL1Loss=0.0686
+ throughput/total_tokens=438,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2286/500000]
+ train/ActionL1Loss=0.0756
+ throughput/total_tokens=438,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2287/500000]
+ train/ActionL1Loss=0.0658
+ throughput/total_tokens=439,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2288/500000]
+ train/ActionL1Loss=0.0659
+ throughput/total_tokens=439,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2289/500000]
+ train/ActionL1Loss=0.0772
+ throughput/total_tokens=439,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2290/500000]
+ train/ActionL1Loss=0.0710
+ throughput/total_tokens=439,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2291/500000]
+ train/ActionL1Loss=0.0731
+ throughput/total_tokens=439,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2292/500000]
+ train/ActionL1Loss=0.0648
+ throughput/total_tokens=440,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2293/500000]
+ train/ActionL1Loss=0.0712
+ throughput/total_tokens=440,256,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2294/500000]
+ train/ActionL1Loss=0.0767
+ throughput/total_tokens=440,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2295/500000]
+ train/ActionL1Loss=0.0723
+ throughput/total_tokens=440,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2296/500000]
+ train/ActionL1Loss=0.0582
+ throughput/total_tokens=440,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2297/500000]
+ train/ActionL1Loss=0.0786
+ throughput/total_tokens=441,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2298/500000]
+ train/ActionL1Loss=0.0756
+ throughput/total_tokens=441,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2299/500000]
+ train/ActionL1Loss=0.0630
+ throughput/total_tokens=441,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2300/500000]
+ optim/total_grad_norm=8.065
+ train/ActionL1Loss=0.0687
+ throughput/total_tokens=441,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2301/500000]
+ train/ActionL1Loss=0.0667
+ throughput/total_tokens=441,792,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2302/500000]
+ train/ActionL1Loss=0.0680
+ throughput/total_tokens=441,984,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2303/500000]
+ train/ActionL1Loss=0.0668
+ throughput/total_tokens=442,176,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2304/500000]
+ train/ActionL1Loss=0.0665
+ throughput/total_tokens=442,368,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2305/500000]
+ train/ActionL1Loss=0.0682
+ throughput/total_tokens=442,560,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2306/500000]
+ train/ActionL1Loss=0.0884
+ throughput/total_tokens=442,752,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2307/500000]
+ train/ActionL1Loss=0.0676
+ throughput/total_tokens=442,944,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2308/500000]
+ train/ActionL1Loss=0.0736
+ throughput/total_tokens=443,136,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2309/500000]
+ train/ActionL1Loss=0.0701
+ throughput/total_tokens=443,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2310/500000]
+ train/ActionL1Loss=0.0736
+ throughput/total_tokens=443,520,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2311/500000]
+ train/ActionL1Loss=0.0756
+ throughput/total_tokens=443,712,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2312/500000]
+ train/ActionL1Loss=0.0725
+ throughput/total_tokens=443,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2313/500000]
+ train/ActionL1Loss=0.0801
+ throughput/total_tokens=444,096,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2314/500000]
+ train/ActionL1Loss=0.0667
+ throughput/total_tokens=444,288,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2315/500000]
+ train/ActionL1Loss=0.0605
+ throughput/total_tokens=444,480,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2316/500000]
+ train/ActionL1Loss=0.0819
+ throughput/total_tokens=444,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2317/500000]
+ train/ActionL1Loss=0.0673
+ throughput/total_tokens=444,864,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2318/500000]
+ train/ActionL1Loss=0.0890
+ throughput/total_tokens=445,056,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2319/500000]
+ train/ActionL1Loss=0.0712
+ throughput/total_tokens=445,248,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2320/500000]
+ optim/total_grad_norm=7.641
+ train/ActionL1Loss=0.0729
+ throughput/total_tokens=445,440,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2321/500000]
+ train/ActionL1Loss=0.0568
+ throughput/total_tokens=445,632,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2322/500000]
+ train/ActionL1Loss=0.0738
+ throughput/total_tokens=445,824,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2323/500000]
+ train/ActionL1Loss=0.0641
+ throughput/total_tokens=446,016,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2324/500000]
+ train/ActionL1Loss=0.0676
+ throughput/total_tokens=446,208,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2325/500000]
+ train/ActionL1Loss=0.0768
+ throughput/total_tokens=446,400,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2326/500000]
+ train/ActionL1Loss=0.0659
+ throughput/total_tokens=446,592,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2327/500000]
+ train/ActionL1Loss=0.0808
+ throughput/total_tokens=446,784,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2328/500000]
+ train/ActionL1Loss=0.0546
+ throughput/total_tokens=446,976,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2329/500000]
+ train/ActionL1Loss=0.0748
+ throughput/total_tokens=447,168,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2330/500000]
+ train/ActionL1Loss=0.0703
+ throughput/total_tokens=447,360,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2331/500000]
+ train/ActionL1Loss=0.0686
+ throughput/total_tokens=447,552,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2332/500000]
+ train/ActionL1Loss=0.0677
+ throughput/total_tokens=447,744,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2333/500000]
+ train/ActionL1Loss=0.0640
+ throughput/total_tokens=447,936,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2334/500000]
+ train/ActionL1Loss=0.0689
+ throughput/total_tokens=448,128,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2335/500000]
+ train/ActionL1Loss=0.0602
+ throughput/total_tokens=448,320,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2336/500000]
+ train/ActionL1Loss=0.0590
+ throughput/total_tokens=448,512,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2337/500000]
+ train/ActionL1Loss=0.0605
+ throughput/total_tokens=448,704,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2338/500000]
+ train/ActionL1Loss=0.0559
+ throughput/total_tokens=448,896,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2339/500000]
+ train/ActionL1Loss=0.0567
+ throughput/total_tokens=449,088,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2340/500000]
+ optim/total_grad_norm=9.645
+ train/ActionL1Loss=0.0614
+ throughput/total_tokens=449,280,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2341/500000]
+ train/ActionL1Loss=0.0566
+ throughput/total_tokens=449,472,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2342/500000]
+ train/ActionL1Loss=0.0540
+ throughput/total_tokens=449,664,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2343/500000]
+ train/ActionL1Loss=0.0631
+ throughput/total_tokens=449,856,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2344/500000]
+ train/ActionL1Loss=0.0753
+ throughput/total_tokens=450,048,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2345/500000]
+ train/ActionL1Loss=0.0530
+ throughput/total_tokens=450,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2346/500000]
+ train/ActionL1Loss=0.0666
+ throughput/total_tokens=450,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2347/500000]
+ train/ActionL1Loss=0.0626
+ throughput/total_tokens=450,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2348/500000]
+ train/ActionL1Loss=0.0561
+ throughput/total_tokens=450,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2349/500000]
+ train/ActionL1Loss=0.0624
+ throughput/total_tokens=451,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2350/500000]
+ train/ActionL1Loss=0.0734
+ throughput/total_tokens=451,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2351/500000]
+ train/ActionL1Loss=0.0809
+ throughput/total_tokens=451,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2352/500000]
+ train/ActionL1Loss=0.0693
+ throughput/total_tokens=451,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2353/500000]
+ train/ActionL1Loss=0.0752
+ throughput/total_tokens=451,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2354/500000]
+ train/ActionL1Loss=0.0554
+ throughput/total_tokens=451,968,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2355/500000]
+ train/ActionL1Loss=0.0646
+ throughput/total_tokens=452,160,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2356/500000]
+ train/ActionL1Loss=0.0676
+ throughput/total_tokens=452,352,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2357/500000]
+ train/ActionL1Loss=0.0597
+ throughput/total_tokens=452,544,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2358/500000]
+ train/ActionL1Loss=0.0510
+ throughput/total_tokens=452,736,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2359/500000]
+ train/ActionL1Loss=0.0441
+ throughput/total_tokens=452,928,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2360/500000]
+ optim/total_grad_norm=8.895
+ train/ActionL1Loss=0.0555
+ throughput/total_tokens=453,120,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2361/500000]
+ train/ActionL1Loss=0.0764
+ throughput/total_tokens=453,312,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2362/500000]
+ train/ActionL1Loss=0.0596
+ throughput/total_tokens=453,504,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2363/500000]
+ train/ActionL1Loss=0.0617
+ throughput/total_tokens=453,696,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2364/500000]
+ train/ActionL1Loss=0.0554
+ throughput/total_tokens=453,888,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2365/500000]
+ train/ActionL1Loss=0.0596
+ throughput/total_tokens=454,080,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2366/500000]
+ train/ActionL1Loss=0.0570
+ throughput/total_tokens=454,272,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2367/500000]
+ train/ActionL1Loss=0.0658
+ throughput/total_tokens=454,464,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2368/500000]
+ train/ActionL1Loss=0.0725
+ throughput/total_tokens=454,656,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2369/500000]
+ train/ActionL1Loss=0.0546
+ throughput/total_tokens=454,848,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2370/500000]
+ train/ActionL1Loss=0.0580
+ throughput/total_tokens=455,040,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=2371/500000]
+ train/ActionL1Loss=0.0594
+ throughput/total_tokens=455,232,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=2372/500000]
+ train/ActionL1Loss=0.0557
+ throughput/total_tokens=455,424,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=2373/500000]
+ train/ActionL1Loss=0.0708
+ throughput/total_tokens=455,616,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=2374/500000]
+ train/ActionL1Loss=0.0575
+ throughput/total_tokens=455,808,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=2375/500000]
+ train/ActionL1Loss=0.0616
+ throughput/total_tokens=456,000,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=2376/500000]
+ train/ActionL1Loss=0.0585
+ throughput/total_tokens=456,192,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=2377/500000]
+ train/ActionL1Loss=0.0689
+ throughput/total_tokens=456,384,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=2378/500000]
+ train/ActionL1Loss=0.0603
+ throughput/total_tokens=456,576,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2379/500000]
+ train/ActionL1Loss=0.0600
+ throughput/total_tokens=456,768,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2380/500000]
+ optim/total_grad_norm=10.31
+ train/ActionL1Loss=0.0828
+ throughput/total_tokens=456,960,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2381/500000]
+ train/ActionL1Loss=0.0671
+ throughput/total_tokens=457,152,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2382/500000]
+ train/ActionL1Loss=0.0607
+ throughput/total_tokens=457,344,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2383/500000]
+ train/ActionL1Loss=0.0675
+ throughput/total_tokens=457,536,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2384/500000]
+ train/ActionL1Loss=0.0663
+ throughput/total_tokens=457,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2385/500000]
+ train/ActionL1Loss=0.0650
+ throughput/total_tokens=457,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2386/500000]
+ train/ActionL1Loss=0.0466
+ throughput/total_tokens=458,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2387/500000]
+ train/ActionL1Loss=0.0525
+ throughput/total_tokens=458,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2388/500000]
+ train/ActionL1Loss=0.0589
+ throughput/total_tokens=458,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2389/500000]
+ train/ActionL1Loss=0.0582
+ throughput/total_tokens=458,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2390/500000]
+ train/ActionL1Loss=0.0655
+ throughput/total_tokens=458,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2391/500000]
+ train/ActionL1Loss=0.0512
+ throughput/total_tokens=459,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2392/500000]
+ train/ActionL1Loss=0.0545
+ throughput/total_tokens=459,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2393/500000]
+ train/ActionL1Loss=0.0555
+ throughput/total_tokens=459,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2394/500000]
+ train/ActionL1Loss=0.0660
+ throughput/total_tokens=459,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2395/500000]
+ train/ActionL1Loss=0.0552
+ throughput/total_tokens=459,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2396/500000]
+ train/ActionL1Loss=0.0506
+ throughput/total_tokens=460,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2397/500000]
+ train/ActionL1Loss=0.0562
+ throughput/total_tokens=460,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2398/500000]
+ train/ActionL1Loss=0.0600
+ throughput/total_tokens=460,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2399/500000]
+ train/ActionL1Loss=0.0597
+ throughput/total_tokens=460,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2400/500000]
+ optim/total_grad_norm=10.71
+ train/ActionL1Loss=0.0758
+ throughput/total_tokens=460,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2401/500000]
+ train/ActionL1Loss=0.0524
+ throughput/total_tokens=460,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2402/500000]
+ train/ActionL1Loss=0.0667
+ throughput/total_tokens=461,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2403/500000]
+ train/ActionL1Loss=0.0720
+ throughput/total_tokens=461,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2404/500000]
+ train/ActionL1Loss=0.0815
+ throughput/total_tokens=461,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2405/500000]
+ train/ActionL1Loss=0.0652
+ throughput/total_tokens=461,760,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2406/500000]
+ train/ActionL1Loss=0.0608
+ throughput/total_tokens=461,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2407/500000]
+ train/ActionL1Loss=0.0718
+ throughput/total_tokens=462,144,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2408/500000]
+ train/ActionL1Loss=0.0710
+ throughput/total_tokens=462,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2409/500000]
+ train/ActionL1Loss=0.0595
+ throughput/total_tokens=462,528,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2410/500000]
+ train/ActionL1Loss=0.0697
+ throughput/total_tokens=462,720,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=2411/500000]
+ train/ActionL1Loss=0.0638
+ throughput/total_tokens=462,912,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2412/500000]
+ train/ActionL1Loss=0.0631
+ throughput/total_tokens=463,104,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2413/500000]
+ train/ActionL1Loss=0.0700
+ throughput/total_tokens=463,296,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2414/500000]
+ train/ActionL1Loss=0.0602
+ throughput/total_tokens=463,488,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2415/500000]
+ train/ActionL1Loss=0.0603
+ throughput/total_tokens=463,680,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2416/500000]
+ train/ActionL1Loss=0.0687
+ throughput/total_tokens=463,872,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2417/500000]
+ train/ActionL1Loss=0.0631
+ throughput/total_tokens=464,064,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2418/500000]
+ train/ActionL1Loss=0.0631
+ throughput/total_tokens=464,256,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2419/500000]
+ train/ActionL1Loss=0.0694
+ throughput/total_tokens=464,448,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2420/500000]
+ optim/total_grad_norm=9.331
+ train/ActionL1Loss=0.0626
+ throughput/total_tokens=464,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2421/500000]
+ train/ActionL1Loss=0.0612
+ throughput/total_tokens=464,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2422/500000]
+ train/ActionL1Loss=0.0682
+ throughput/total_tokens=465,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2423/500000]
+ train/ActionL1Loss=0.0639
+ throughput/total_tokens=465,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2424/500000]
+ train/ActionL1Loss=0.0663
+ throughput/total_tokens=465,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2425/500000]
+ train/ActionL1Loss=0.0597
+ throughput/total_tokens=465,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2426/500000]
+ train/ActionL1Loss=0.0613
+ throughput/total_tokens=465,792,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2427/500000]
+ train/ActionL1Loss=0.0733
+ throughput/total_tokens=465,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2428/500000]
+ train/ActionL1Loss=0.0663
+ throughput/total_tokens=466,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2429/500000]
+ train/ActionL1Loss=0.0549
+ throughput/total_tokens=466,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2430/500000]
+ train/ActionL1Loss=0.0550
+ throughput/total_tokens=466,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2431/500000]
+ train/ActionL1Loss=0.0639
+ throughput/total_tokens=466,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2432/500000]
+ train/ActionL1Loss=0.0746
+ throughput/total_tokens=466,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2433/500000]
+ train/ActionL1Loss=0.0638
+ throughput/total_tokens=467,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2434/500000]
+ train/ActionL1Loss=0.0657
+ throughput/total_tokens=467,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2435/500000]
+ train/ActionL1Loss=0.0683
+ throughput/total_tokens=467,520,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2436/500000]
+ train/ActionL1Loss=0.0574
+ throughput/total_tokens=467,712,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2437/500000]
+ train/ActionL1Loss=0.0619
+ throughput/total_tokens=467,904,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2438/500000]
+ train/ActionL1Loss=0.0601
+ throughput/total_tokens=468,096,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2439/500000]
+ train/ActionL1Loss=0.0562
+ throughput/total_tokens=468,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2440/500000]
+ optim/total_grad_norm=8.143
+ train/ActionL1Loss=0.0554
+ throughput/total_tokens=468,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2441/500000]
+ train/ActionL1Loss=0.0544
+ throughput/total_tokens=468,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2442/500000]
+ train/ActionL1Loss=0.0618
+ throughput/total_tokens=468,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2443/500000]
+ train/ActionL1Loss=0.0499
+ throughput/total_tokens=469,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2444/500000]
+ train/ActionL1Loss=0.0634
+ throughput/total_tokens=469,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2445/500000]
+ train/ActionL1Loss=0.0540
+ throughput/total_tokens=469,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2446/500000]
+ train/ActionL1Loss=0.0608
+ throughput/total_tokens=469,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2447/500000]
+ train/ActionL1Loss=0.0493
+ throughput/total_tokens=469,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2448/500000]
+ train/ActionL1Loss=0.0555
+ throughput/total_tokens=470,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2449/500000]
+ train/ActionL1Loss=0.0617
+ throughput/total_tokens=470,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2450/500000]
+ train/ActionL1Loss=0.0485
+ throughput/total_tokens=470,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2451/500000]
+ train/ActionL1Loss=0.0507
+ throughput/total_tokens=470,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2452/500000]
+ train/ActionL1Loss=0.0622
+ throughput/total_tokens=470,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2453/500000]
+ train/ActionL1Loss=0.0540
+ throughput/total_tokens=470,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2454/500000]
+ train/ActionL1Loss=0.0519
+ throughput/total_tokens=471,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2455/500000]
+ train/ActionL1Loss=0.0619
+ throughput/total_tokens=471,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2456/500000]
+ train/ActionL1Loss=0.0719
+ throughput/total_tokens=471,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2457/500000]
+ train/ActionL1Loss=0.0781
+ throughput/total_tokens=471,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2458/500000]
+ train/ActionL1Loss=0.0542
+ throughput/total_tokens=471,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2459/500000]
+ train/ActionL1Loss=0.0485
+ throughput/total_tokens=472,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2460/500000]
+ optim/total_grad_norm=9.239
+ train/ActionL1Loss=0.0717
+ throughput/total_tokens=472,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=2461/500000]
+ train/ActionL1Loss=0.0616
+ throughput/total_tokens=472,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2462/500000]
+ train/ActionL1Loss=0.0578
+ throughput/total_tokens=472,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2463/500000]
+ train/ActionL1Loss=0.0432
+ throughput/total_tokens=472,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2464/500000]
+ train/ActionL1Loss=0.0527
+ throughput/total_tokens=473,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2465/500000]
+ train/ActionL1Loss=0.0570
+ throughput/total_tokens=473,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2466/500000]
+ train/ActionL1Loss=0.0562
+ throughput/total_tokens=473,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2467/500000]
+ train/ActionL1Loss=0.0539
+ throughput/total_tokens=473,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2468/500000]
+ train/ActionL1Loss=0.0477
+ throughput/total_tokens=473,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2469/500000]
+ train/ActionL1Loss=0.0674
+ throughput/total_tokens=474,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2470/500000]
+ train/ActionL1Loss=0.0770
+ throughput/total_tokens=474,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2471/500000]
+ train/ActionL1Loss=0.0615
+ throughput/total_tokens=474,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2472/500000]
+ train/ActionL1Loss=0.0623
+ throughput/total_tokens=474,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2473/500000]
+ train/ActionL1Loss=0.0599
+ throughput/total_tokens=474,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2474/500000]
+ train/ActionL1Loss=0.0638
+ throughput/total_tokens=475,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2475/500000]
+ train/ActionL1Loss=0.0488
+ throughput/total_tokens=475,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2476/500000]
+ train/ActionL1Loss=0.0625
+ throughput/total_tokens=475,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2477/500000]
+ train/ActionL1Loss=0.0699
+ throughput/total_tokens=475,584,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2478/500000]
+ train/ActionL1Loss=0.0631
+ throughput/total_tokens=475,776,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2479/500000]
+ train/ActionL1Loss=0.0718
+ throughput/total_tokens=475,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2480/500000]
+ optim/total_grad_norm=10.97
+ train/ActionL1Loss=0.0533
+ throughput/total_tokens=476,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2481/500000]
+ train/ActionL1Loss=0.0657
+ throughput/total_tokens=476,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2482/500000]
+ train/ActionL1Loss=0.0518
+ throughput/total_tokens=476,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2483/500000]
+ train/ActionL1Loss=0.0763
+ throughput/total_tokens=476,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2484/500000]
+ train/ActionL1Loss=0.0627
+ throughput/total_tokens=476,928,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2485/500000]
+ train/ActionL1Loss=0.0580
+ throughput/total_tokens=477,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2486/500000]
+ train/ActionL1Loss=0.0524
+ throughput/total_tokens=477,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2487/500000]
+ train/ActionL1Loss=0.0537
+ throughput/total_tokens=477,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2488/500000]
+ train/ActionL1Loss=0.0439
+ throughput/total_tokens=477,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2489/500000]
+ train/ActionL1Loss=0.0557
+ throughput/total_tokens=477,888,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2490/500000]
+ train/ActionL1Loss=0.0557
+ throughput/total_tokens=478,080,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2491/500000]
+ train/ActionL1Loss=0.0666
+ throughput/total_tokens=478,272,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2492/500000]
+ train/ActionL1Loss=0.0612
+ throughput/total_tokens=478,464,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2493/500000]
+ train/ActionL1Loss=0.0587
+ throughput/total_tokens=478,656,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2494/500000]
+ train/ActionL1Loss=0.0563
+ throughput/total_tokens=478,848,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2495/500000]
+ train/ActionL1Loss=0.0615
+ throughput/total_tokens=479,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2496/500000]
+ train/ActionL1Loss=0.0827
+ throughput/total_tokens=479,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2497/500000]
+ train/ActionL1Loss=0.0593
+ throughput/total_tokens=479,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2498/500000]
+ train/ActionL1Loss=0.0588
+ throughput/total_tokens=479,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2499/500000]
+ train/ActionL1Loss=0.0620
+ throughput/total_tokens=479,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2500/500000]
+ optim/total_grad_norm=7.997
+ train/ActionL1Loss=0.0648
+ throughput/total_tokens=480,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+10/03 [07:03:28] INFO | >> Saving config... checkpoint.py:608
+10/03 [07:04:04] INFO | >> Saving model state... checkpoint.py:796
+10/03 [07:05:14] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [07:06:44] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=2501/500000]
+ train/ActionL1Loss=0.0594
+ throughput/total_tokens=480,192,000
+ throughput/device/tokens_per_second=1,220
+ throughput/device/batches_per_second=0.0509
+[step=2502/500000]
+ train/ActionL1Loss=0.0699
+ throughput/total_tokens=480,384,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2503/500000]
+ train/ActionL1Loss=0.0768
+ throughput/total_tokens=480,576,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=2504/500000]
+ train/ActionL1Loss=0.0672
+ throughput/total_tokens=480,768,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=2505/500000]
+ train/ActionL1Loss=0.0636
+ throughput/total_tokens=480,960,000
+ throughput/device/tokens_per_second=1,164
+ throughput/device/batches_per_second=0.0485
+[step=2506/500000]
+ train/ActionL1Loss=0.0631
+ throughput/total_tokens=481,152,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=2507/500000]
+ train/ActionL1Loss=0.0608
+ throughput/total_tokens=481,344,000
+ throughput/device/tokens_per_second=1,171
+ throughput/device/batches_per_second=0.0488
+[step=2508/500000]
+ train/ActionL1Loss=0.0677
+ throughput/total_tokens=481,536,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=2509/500000]
+ train/ActionL1Loss=0.0660
+ throughput/total_tokens=481,728,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=2510/500000]
+ train/ActionL1Loss=0.0695
+ throughput/total_tokens=481,920,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+ System/Peak GPU Memory (MB)=46,917
+[step=2511/500000]
+ train/ActionL1Loss=0.0603
+ throughput/total_tokens=482,112,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=2512/500000]
+ train/ActionL1Loss=0.0578
+ throughput/total_tokens=482,304,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=2513/500000]
+ train/ActionL1Loss=0.0581
+ throughput/total_tokens=482,496,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=2514/500000]
+ train/ActionL1Loss=0.0672
+ throughput/total_tokens=482,688,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=2515/500000]
+ train/ActionL1Loss=0.0686
+ throughput/total_tokens=482,880,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=2516/500000]
+ train/ActionL1Loss=0.0755
+ throughput/total_tokens=483,072,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=2517/500000]
+ train/ActionL1Loss=0.0714
+ throughput/total_tokens=483,264,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=2518/500000]
+ train/ActionL1Loss=0.0683
+ throughput/total_tokens=483,456,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=2519/500000]
+ train/ActionL1Loss=0.0638
+ throughput/total_tokens=483,648,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=2520/500000]
+ optim/total_grad_norm=9.595
+ train/ActionL1Loss=0.0586
+ throughput/total_tokens=483,840,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=2521/500000]
+ train/ActionL1Loss=0.0787
+ throughput/total_tokens=484,032,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=2522/500000]
+ train/ActionL1Loss=0.0814
+ throughput/total_tokens=484,224,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=2523/500000]
+ train/ActionL1Loss=0.0548
+ throughput/total_tokens=484,416,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2524/500000]
+ train/ActionL1Loss=0.0641
+ throughput/total_tokens=484,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2525/500000]
+ train/ActionL1Loss=0.0692
+ throughput/total_tokens=484,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2526/500000]
+ train/ActionL1Loss=0.0646
+ throughput/total_tokens=484,992,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2527/500000]
+ train/ActionL1Loss=0.0594
+ throughput/total_tokens=485,184,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2528/500000]
+ train/ActionL1Loss=0.0606
+ throughput/total_tokens=485,376,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2529/500000]
+ train/ActionL1Loss=0.0732
+ throughput/total_tokens=485,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2530/500000]
+ train/ActionL1Loss=0.0766
+ throughput/total_tokens=485,760,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2531/500000]
+ train/ActionL1Loss=0.0705
+ throughput/total_tokens=485,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2532/500000]
+ train/ActionL1Loss=0.0531
+ throughput/total_tokens=486,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2533/500000]
+ train/ActionL1Loss=0.0519
+ throughput/total_tokens=486,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2534/500000]
+ train/ActionL1Loss=0.0808
+ throughput/total_tokens=486,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2535/500000]
+ train/ActionL1Loss=0.0529
+ throughput/total_tokens=486,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2536/500000]
+ train/ActionL1Loss=0.0584
+ throughput/total_tokens=486,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2537/500000]
+ train/ActionL1Loss=0.0746
+ throughput/total_tokens=487,104,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2538/500000]
+ train/ActionL1Loss=0.0612
+ throughput/total_tokens=487,296,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2539/500000]
+ train/ActionL1Loss=0.0640
+ throughput/total_tokens=487,488,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2540/500000]
+ optim/total_grad_norm=6.890
+ train/ActionL1Loss=0.0590
+ throughput/total_tokens=487,680,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2541/500000]
+ train/ActionL1Loss=0.0569
+ throughput/total_tokens=487,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2542/500000]
+ train/ActionL1Loss=0.0759
+ throughput/total_tokens=488,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2543/500000]
+ train/ActionL1Loss=0.0607
+ throughput/total_tokens=488,256,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2544/500000]
+ train/ActionL1Loss=0.0588
+ throughput/total_tokens=488,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2545/500000]
+ train/ActionL1Loss=0.0654
+ throughput/total_tokens=488,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2546/500000]
+ train/ActionL1Loss=0.0703
+ throughput/total_tokens=488,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2547/500000]
+ train/ActionL1Loss=0.0544
+ throughput/total_tokens=489,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2548/500000]
+ train/ActionL1Loss=0.0666
+ throughput/total_tokens=489,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2549/500000]
+ train/ActionL1Loss=0.0580
+ throughput/total_tokens=489,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2550/500000]
+ train/ActionL1Loss=0.0463
+ throughput/total_tokens=489,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2551/500000]
+ train/ActionL1Loss=0.0512
+ throughput/total_tokens=489,792,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2552/500000]
+ train/ActionL1Loss=0.0688
+ throughput/total_tokens=489,984,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2553/500000]
+ train/ActionL1Loss=0.0786
+ throughput/total_tokens=490,176,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2554/500000]
+ train/ActionL1Loss=0.0834
+ throughput/total_tokens=490,368,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2555/500000]
+ train/ActionL1Loss=0.0608
+ throughput/total_tokens=490,560,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2556/500000]
+ train/ActionL1Loss=0.0634
+ throughput/total_tokens=490,752,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2557/500000]
+ train/ActionL1Loss=0.0787
+ throughput/total_tokens=490,944,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2558/500000]
+ train/ActionL1Loss=0.0596
+ throughput/total_tokens=491,136,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2559/500000]
+ train/ActionL1Loss=0.0516
+ throughput/total_tokens=491,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2560/500000]
+ optim/total_grad_norm=10.11
+ train/ActionL1Loss=0.0668
+ throughput/total_tokens=491,520,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2561/500000]
+ train/ActionL1Loss=0.0868
+ throughput/total_tokens=491,712,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2562/500000]
+ train/ActionL1Loss=0.0711
+ throughput/total_tokens=491,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2563/500000]
+ train/ActionL1Loss=0.0598
+ throughput/total_tokens=492,096,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2564/500000]
+ train/ActionL1Loss=0.0581
+ throughput/total_tokens=492,288,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2565/500000]
+ train/ActionL1Loss=0.0765
+ throughput/total_tokens=492,480,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2566/500000]
+ train/ActionL1Loss=0.0702
+ throughput/total_tokens=492,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2567/500000]
+ train/ActionL1Loss=0.0798
+ throughput/total_tokens=492,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2568/500000]
+ train/ActionL1Loss=0.0663
+ throughput/total_tokens=493,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2569/500000]
+ train/ActionL1Loss=0.0738
+ throughput/total_tokens=493,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2570/500000]
+ train/ActionL1Loss=0.0689
+ throughput/total_tokens=493,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2571/500000]
+ train/ActionL1Loss=0.0750
+ throughput/total_tokens=493,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2572/500000]
+ train/ActionL1Loss=0.0837
+ throughput/total_tokens=493,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2573/500000]
+ train/ActionL1Loss=0.0752
+ throughput/total_tokens=494,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2574/500000]
+ train/ActionL1Loss=0.0953
+ throughput/total_tokens=494,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2575/500000]
+ train/ActionL1Loss=0.0655
+ throughput/total_tokens=494,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2576/500000]
+ train/ActionL1Loss=0.0719
+ throughput/total_tokens=494,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2577/500000]
+ train/ActionL1Loss=0.0902
+ throughput/total_tokens=494,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2578/500000]
+ train/ActionL1Loss=0.0690
+ throughput/total_tokens=494,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2579/500000]
+ train/ActionL1Loss=0.0841
+ throughput/total_tokens=495,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2580/500000]
+ optim/total_grad_norm=6.830
+ train/ActionL1Loss=0.0725
+ throughput/total_tokens=495,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2581/500000]
+ train/ActionL1Loss=0.0617
+ throughput/total_tokens=495,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2582/500000]
+ train/ActionL1Loss=0.0750
+ throughput/total_tokens=495,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2583/500000]
+ train/ActionL1Loss=0.0584
+ throughput/total_tokens=495,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2584/500000]
+ train/ActionL1Loss=0.0589
+ throughput/total_tokens=496,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2585/500000]
+ train/ActionL1Loss=0.0597
+ throughput/total_tokens=496,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2586/500000]
+ train/ActionL1Loss=0.0789
+ throughput/total_tokens=496,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2587/500000]
+ train/ActionL1Loss=0.0577
+ throughput/total_tokens=496,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2588/500000]
+ train/ActionL1Loss=0.0647
+ throughput/total_tokens=496,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2589/500000]
+ train/ActionL1Loss=0.0801
+ throughput/total_tokens=497,088,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2590/500000]
+ train/ActionL1Loss=0.0589
+ throughput/total_tokens=497,280,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2591/500000]
+ train/ActionL1Loss=0.0731
+ throughput/total_tokens=497,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2592/500000]
+ train/ActionL1Loss=0.0589
+ throughput/total_tokens=497,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2593/500000]
+ train/ActionL1Loss=0.0671
+ throughput/total_tokens=497,856,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2594/500000]
+ train/ActionL1Loss=0.0602
+ throughput/total_tokens=498,048,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2595/500000]
+ train/ActionL1Loss=0.0619
+ throughput/total_tokens=498,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2596/500000]
+ train/ActionL1Loss=0.0781
+ throughput/total_tokens=498,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2597/500000]
+ train/ActionL1Loss=0.0765
+ throughput/total_tokens=498,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2598/500000]
+ train/ActionL1Loss=0.0676
+ throughput/total_tokens=498,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2599/500000]
+ train/ActionL1Loss=0.0745
+ throughput/total_tokens=499,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2600/500000]
+ optim/total_grad_norm=7.630
+ train/ActionL1Loss=0.0667
+ throughput/total_tokens=499,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2601/500000]
+ train/ActionL1Loss=0.0775
+ throughput/total_tokens=499,392,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2602/500000]
+ train/ActionL1Loss=0.0730
+ throughput/total_tokens=499,584,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2603/500000]
+ train/ActionL1Loss=0.0719
+ throughput/total_tokens=499,776,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2604/500000]
+ train/ActionL1Loss=0.0719
+ throughput/total_tokens=499,968,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2605/500000]
+ train/ActionL1Loss=0.0665
+ throughput/total_tokens=500,160,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2606/500000]
+ train/ActionL1Loss=0.0671
+ throughput/total_tokens=500,352,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2607/500000]
+ train/ActionL1Loss=0.0586
+ throughput/total_tokens=500,544,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2608/500000]
+ train/ActionL1Loss=0.0588
+ throughput/total_tokens=500,736,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2609/500000]
+ train/ActionL1Loss=0.0673
+ throughput/total_tokens=500,928,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2610/500000]
+ train/ActionL1Loss=0.0595
+ throughput/total_tokens=501,120,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=2611/500000]
+ train/ActionL1Loss=0.0725
+ throughput/total_tokens=501,312,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2612/500000]
+ train/ActionL1Loss=0.0529
+ throughput/total_tokens=501,504,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2613/500000]
+ train/ActionL1Loss=0.0601
+ throughput/total_tokens=501,696,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2614/500000]
+ train/ActionL1Loss=0.0651
+ throughput/total_tokens=501,888,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2615/500000]
+ train/ActionL1Loss=0.0583
+ throughput/total_tokens=502,080,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2616/500000]
+ train/ActionL1Loss=0.0552
+ throughput/total_tokens=502,272,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2617/500000]
+ train/ActionL1Loss=0.0664
+ throughput/total_tokens=502,464,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2618/500000]
+ train/ActionL1Loss=0.0734
+ throughput/total_tokens=502,656,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2619/500000]
+ train/ActionL1Loss=0.0569
+ throughput/total_tokens=502,848,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=2620/500000]
+ optim/total_grad_norm=6.965
+ train/ActionL1Loss=0.0830
+ throughput/total_tokens=503,040,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2621/500000]
+ train/ActionL1Loss=0.0718
+ throughput/total_tokens=503,232,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2622/500000]
+ train/ActionL1Loss=0.0650
+ throughput/total_tokens=503,424,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2623/500000]
+ train/ActionL1Loss=0.0608
+ throughput/total_tokens=503,616,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2624/500000]
+ train/ActionL1Loss=0.0764
+ throughput/total_tokens=503,808,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2625/500000]
+ train/ActionL1Loss=0.0702
+ throughput/total_tokens=504,000,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2626/500000]
+ train/ActionL1Loss=0.0739
+ throughput/total_tokens=504,192,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2627/500000]
+ train/ActionL1Loss=0.0890
+ throughput/total_tokens=504,384,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2628/500000]
+ train/ActionL1Loss=0.0689
+ throughput/total_tokens=504,576,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2629/500000]
+ train/ActionL1Loss=0.0653
+ throughput/total_tokens=504,768,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2630/500000]
+ train/ActionL1Loss=0.0793
+ throughput/total_tokens=504,960,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2631/500000]
+ train/ActionL1Loss=0.0701
+ throughput/total_tokens=505,152,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2632/500000]
+ train/ActionL1Loss=0.0840
+ throughput/total_tokens=505,344,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2633/500000]
+ train/ActionL1Loss=0.0661
+ throughput/total_tokens=505,536,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2634/500000]
+ train/ActionL1Loss=0.0701
+ throughput/total_tokens=505,728,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2635/500000]
+ train/ActionL1Loss=0.0710
+ throughput/total_tokens=505,920,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2636/500000]
+ train/ActionL1Loss=0.0601
+ throughput/total_tokens=506,112,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2637/500000]
+ train/ActionL1Loss=0.0660
+ throughput/total_tokens=506,304,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2638/500000]
+ train/ActionL1Loss=0.0649
+ throughput/total_tokens=506,496,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2639/500000]
+ train/ActionL1Loss=0.0618
+ throughput/total_tokens=506,688,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2640/500000]
+ optim/total_grad_norm=7.522
+ train/ActionL1Loss=0.0581
+ throughput/total_tokens=506,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2641/500000]
+ train/ActionL1Loss=0.0681
+ throughput/total_tokens=507,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2642/500000]
+ train/ActionL1Loss=0.0627
+ throughput/total_tokens=507,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2643/500000]
+ train/ActionL1Loss=0.0624
+ throughput/total_tokens=507,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2644/500000]
+ train/ActionL1Loss=0.0567
+ throughput/total_tokens=507,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2645/500000]
+ train/ActionL1Loss=0.0686
+ throughput/total_tokens=507,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2646/500000]
+ train/ActionL1Loss=0.0682
+ throughput/total_tokens=508,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2647/500000]
+ train/ActionL1Loss=0.0601
+ throughput/total_tokens=508,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2648/500000]
+ train/ActionL1Loss=0.0683
+ throughput/total_tokens=508,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2649/500000]
+ train/ActionL1Loss=0.0698
+ throughput/total_tokens=508,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2650/500000]
+ train/ActionL1Loss=0.0623
+ throughput/total_tokens=508,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2651/500000]
+ train/ActionL1Loss=0.0680
+ throughput/total_tokens=508,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2652/500000]
+ train/ActionL1Loss=0.0608
+ throughput/total_tokens=509,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2653/500000]
+ train/ActionL1Loss=0.0521
+ throughput/total_tokens=509,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2654/500000]
+ train/ActionL1Loss=0.0682
+ throughput/total_tokens=509,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2655/500000]
+ train/ActionL1Loss=0.0780
+ throughput/total_tokens=509,760,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2656/500000]
+ train/ActionL1Loss=0.0544
+ throughput/total_tokens=509,952,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2657/500000]
+ train/ActionL1Loss=0.0513
+ throughput/total_tokens=510,144,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2658/500000]
+ train/ActionL1Loss=0.0610
+ throughput/total_tokens=510,336,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2659/500000]
+ train/ActionL1Loss=0.0642
+ throughput/total_tokens=510,528,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2660/500000]
+ optim/total_grad_norm=8.934
+ train/ActionL1Loss=0.0630
+ throughput/total_tokens=510,720,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2661/500000]
+ train/ActionL1Loss=0.0558
+ throughput/total_tokens=510,912,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2662/500000]
+ train/ActionL1Loss=0.0532
+ throughput/total_tokens=511,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2663/500000]
+ train/ActionL1Loss=0.0694
+ throughput/total_tokens=511,296,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2664/500000]
+ train/ActionL1Loss=0.0682
+ throughput/total_tokens=511,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2665/500000]
+ train/ActionL1Loss=0.0814
+ throughput/total_tokens=511,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2666/500000]
+ train/ActionL1Loss=0.0608
+ throughput/total_tokens=511,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2667/500000]
+ train/ActionL1Loss=0.0553
+ throughput/total_tokens=512,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2668/500000]
+ train/ActionL1Loss=0.0545
+ throughput/total_tokens=512,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2669/500000]
+ train/ActionL1Loss=0.0592
+ throughput/total_tokens=512,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2670/500000]
+ train/ActionL1Loss=0.0554
+ throughput/total_tokens=512,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2671/500000]
+ train/ActionL1Loss=0.0583
+ throughput/total_tokens=512,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2672/500000]
+ train/ActionL1Loss=0.0425
+ throughput/total_tokens=513,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2673/500000]
+ train/ActionL1Loss=0.0393
+ throughput/total_tokens=513,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2674/500000]
+ train/ActionL1Loss=0.0681
+ throughput/total_tokens=513,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2675/500000]
+ train/ActionL1Loss=0.0591
+ throughput/total_tokens=513,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2676/500000]
+ train/ActionL1Loss=0.0521
+ throughput/total_tokens=513,792,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2677/500000]
+ train/ActionL1Loss=0.0687
+ throughput/total_tokens=513,984,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2678/500000]
+ train/ActionL1Loss=0.0814
+ throughput/total_tokens=514,176,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2679/500000]
+ train/ActionL1Loss=0.0600
+ throughput/total_tokens=514,368,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2680/500000]
+ optim/total_grad_norm=8.684
+ train/ActionL1Loss=0.0536
+ throughput/total_tokens=514,560,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2681/500000]
+ train/ActionL1Loss=0.0509
+ throughput/total_tokens=514,752,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2682/500000]
+ train/ActionL1Loss=0.0611
+ throughput/total_tokens=514,944,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2683/500000]
+ train/ActionL1Loss=0.0594
+ throughput/total_tokens=515,136,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2684/500000]
+ train/ActionL1Loss=0.0719
+ throughput/total_tokens=515,328,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2685/500000]
+ train/ActionL1Loss=0.0563
+ throughput/total_tokens=515,520,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2686/500000]
+ train/ActionL1Loss=0.0834
+ throughput/total_tokens=515,712,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2687/500000]
+ train/ActionL1Loss=0.0561
+ throughput/total_tokens=515,904,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2688/500000]
+ train/ActionL1Loss=0.0502
+ throughput/total_tokens=516,096,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2689/500000]
+ train/ActionL1Loss=0.0593
+ throughput/total_tokens=516,288,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2690/500000]
+ train/ActionL1Loss=0.0605
+ throughput/total_tokens=516,480,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2691/500000]
+ train/ActionL1Loss=0.0655
+ throughput/total_tokens=516,672,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2692/500000]
+ train/ActionL1Loss=0.0537
+ throughput/total_tokens=516,864,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2693/500000]
+ train/ActionL1Loss=0.0619
+ throughput/total_tokens=517,056,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2694/500000]
+ train/ActionL1Loss=0.0552
+ throughput/total_tokens=517,248,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2695/500000]
+ train/ActionL1Loss=0.0529
+ throughput/total_tokens=517,440,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2696/500000]
+ train/ActionL1Loss=0.0483
+ throughput/total_tokens=517,632,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2697/500000]
+ train/ActionL1Loss=0.0526
+ throughput/total_tokens=517,824,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2698/500000]
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=518,016,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2699/500000]
+ train/ActionL1Loss=0.0513
+ throughput/total_tokens=518,208,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2700/500000]
+ optim/total_grad_norm=10.06
+ train/ActionL1Loss=0.0542
+ throughput/total_tokens=518,400,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2701/500000]
+ train/ActionL1Loss=0.0501
+ throughput/total_tokens=518,592,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2702/500000]
+ train/ActionL1Loss=0.0539
+ throughput/total_tokens=518,784,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2703/500000]
+ train/ActionL1Loss=0.0519
+ throughput/total_tokens=518,976,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2704/500000]
+ train/ActionL1Loss=0.0524
+ throughput/total_tokens=519,168,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2705/500000]
+ train/ActionL1Loss=0.0502
+ throughput/total_tokens=519,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2706/500000]
+ train/ActionL1Loss=0.0543
+ throughput/total_tokens=519,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2707/500000]
+ train/ActionL1Loss=0.0564
+ throughput/total_tokens=519,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2708/500000]
+ train/ActionL1Loss=0.0474
+ throughput/total_tokens=519,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2709/500000]
+ train/ActionL1Loss=0.0565
+ throughput/total_tokens=520,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2710/500000]
+ train/ActionL1Loss=0.0622
+ throughput/total_tokens=520,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=2711/500000]
+ train/ActionL1Loss=0.0571
+ throughput/total_tokens=520,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2712/500000]
+ train/ActionL1Loss=0.0517
+ throughput/total_tokens=520,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2713/500000]
+ train/ActionL1Loss=0.0552
+ throughput/total_tokens=520,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2714/500000]
+ train/ActionL1Loss=0.0583
+ throughput/total_tokens=521,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2715/500000]
+ train/ActionL1Loss=0.0528
+ throughput/total_tokens=521,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2716/500000]
+ train/ActionL1Loss=0.0562
+ throughput/total_tokens=521,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2717/500000]
+ train/ActionL1Loss=0.0642
+ throughput/total_tokens=521,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2718/500000]
+ train/ActionL1Loss=0.0518
+ throughput/total_tokens=521,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2719/500000]
+ train/ActionL1Loss=0.0673
+ throughput/total_tokens=522,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2720/500000]
+ optim/total_grad_norm=8.877
+ train/ActionL1Loss=0.0623
+ throughput/total_tokens=522,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2721/500000]
+ train/ActionL1Loss=0.0661
+ throughput/total_tokens=522,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2722/500000]
+ train/ActionL1Loss=0.0672
+ throughput/total_tokens=522,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2723/500000]
+ train/ActionL1Loss=0.0665
+ throughput/total_tokens=522,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2724/500000]
+ train/ActionL1Loss=0.0622
+ throughput/total_tokens=523,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2725/500000]
+ train/ActionL1Loss=0.0576
+ throughput/total_tokens=523,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2726/500000]
+ train/ActionL1Loss=0.0939
+ throughput/total_tokens=523,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2727/500000]
+ train/ActionL1Loss=0.0534
+ throughput/total_tokens=523,584,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2728/500000]
+ train/ActionL1Loss=0.0646
+ throughput/total_tokens=523,776,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2729/500000]
+ train/ActionL1Loss=0.0537
+ throughput/total_tokens=523,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2730/500000]
+ train/ActionL1Loss=0.0469
+ throughput/total_tokens=524,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2731/500000]
+ train/ActionL1Loss=0.0663
+ throughput/total_tokens=524,352,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2732/500000]
+ train/ActionL1Loss=0.0525
+ throughput/total_tokens=524,544,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2733/500000]
+ train/ActionL1Loss=0.0633
+ throughput/total_tokens=524,736,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2734/500000]
+ train/ActionL1Loss=0.0453
+ throughput/total_tokens=524,928,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2735/500000]
+ train/ActionL1Loss=0.0464
+ throughput/total_tokens=525,120,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2736/500000]
+ train/ActionL1Loss=0.0784
+ throughput/total_tokens=525,312,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2737/500000]
+ train/ActionL1Loss=0.0530
+ throughput/total_tokens=525,504,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2738/500000]
+ train/ActionL1Loss=0.0560
+ throughput/total_tokens=525,696,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2739/500000]
+ train/ActionL1Loss=0.0565
+ throughput/total_tokens=525,888,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2740/500000]
+ optim/total_grad_norm=8.114
+ train/ActionL1Loss=0.0430
+ throughput/total_tokens=526,080,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2741/500000]
+ train/ActionL1Loss=0.0630
+ throughput/total_tokens=526,272,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2742/500000]
+ train/ActionL1Loss=0.0535
+ throughput/total_tokens=526,464,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2743/500000]
+ train/ActionL1Loss=0.0584
+ throughput/total_tokens=526,656,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2744/500000]
+ train/ActionL1Loss=0.0574
+ throughput/total_tokens=526,848,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2745/500000]
+ train/ActionL1Loss=0.0636
+ throughput/total_tokens=527,040,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2746/500000]
+ train/ActionL1Loss=0.0737
+ throughput/total_tokens=527,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2747/500000]
+ train/ActionL1Loss=0.0539
+ throughput/total_tokens=527,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2748/500000]
+ train/ActionL1Loss=0.0621
+ throughput/total_tokens=527,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2749/500000]
+ train/ActionL1Loss=0.0498
+ throughput/total_tokens=527,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2750/500000]
+ train/ActionL1Loss=0.0548
+ throughput/total_tokens=528,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2751/500000]
+ train/ActionL1Loss=0.0578
+ throughput/total_tokens=528,192,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2752/500000]
+ train/ActionL1Loss=0.0477
+ throughput/total_tokens=528,384,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2753/500000]
+ train/ActionL1Loss=0.0561
+ throughput/total_tokens=528,576,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2754/500000]
+ train/ActionL1Loss=0.0495
+ throughput/total_tokens=528,768,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2755/500000]
+ train/ActionL1Loss=0.0551
+ throughput/total_tokens=528,960,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2756/500000]
+ train/ActionL1Loss=0.0522
+ throughput/total_tokens=529,152,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2757/500000]
+ train/ActionL1Loss=0.0545
+ throughput/total_tokens=529,344,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2758/500000]
+ train/ActionL1Loss=0.0427
+ throughput/total_tokens=529,536,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2759/500000]
+ train/ActionL1Loss=0.0628
+ throughput/total_tokens=529,728,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2760/500000]
+ optim/total_grad_norm=6.480
+ train/ActionL1Loss=0.0711
+ throughput/total_tokens=529,920,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=2761/500000]
+ train/ActionL1Loss=0.0603
+ throughput/total_tokens=530,112,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2762/500000]
+ train/ActionL1Loss=0.0546
+ throughput/total_tokens=530,304,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2763/500000]
+ train/ActionL1Loss=0.0503
+ throughput/total_tokens=530,496,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2764/500000]
+ train/ActionL1Loss=0.0557
+ throughput/total_tokens=530,688,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2765/500000]
+ train/ActionL1Loss=0.0592
+ throughput/total_tokens=530,880,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2766/500000]
+ train/ActionL1Loss=0.0678
+ throughput/total_tokens=531,072,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2767/500000]
+ train/ActionL1Loss=0.0528
+ throughput/total_tokens=531,264,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2768/500000]
+ train/ActionL1Loss=0.0750
+ throughput/total_tokens=531,456,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2769/500000]
+ train/ActionL1Loss=0.0721
+ throughput/total_tokens=531,648,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2770/500000]
+ train/ActionL1Loss=0.0545
+ throughput/total_tokens=531,840,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2771/500000]
+ train/ActionL1Loss=0.0583
+ throughput/total_tokens=532,032,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2772/500000]
+ train/ActionL1Loss=0.0616
+ throughput/total_tokens=532,224,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2773/500000]
+ train/ActionL1Loss=0.0598
+ throughput/total_tokens=532,416,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2774/500000]
+ train/ActionL1Loss=0.0588
+ throughput/total_tokens=532,608,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2775/500000]
+ train/ActionL1Loss=0.0573
+ throughput/total_tokens=532,800,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2776/500000]
+ train/ActionL1Loss=0.0533
+ throughput/total_tokens=532,992,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2777/500000]
+ train/ActionL1Loss=0.0565
+ throughput/total_tokens=533,184,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2778/500000]
+ train/ActionL1Loss=0.0582
+ throughput/total_tokens=533,376,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2779/500000]
+ train/ActionL1Loss=0.0572
+ throughput/total_tokens=533,568,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2780/500000]
+ optim/total_grad_norm=8.334
+ train/ActionL1Loss=0.0512
+ throughput/total_tokens=533,760,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2781/500000]
+ train/ActionL1Loss=0.0650
+ throughput/total_tokens=533,952,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2782/500000]
+ train/ActionL1Loss=0.0470
+ throughput/total_tokens=534,144,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2783/500000]
+ train/ActionL1Loss=0.0475
+ throughput/total_tokens=534,336,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2784/500000]
+ train/ActionL1Loss=0.0497
+ throughput/total_tokens=534,528,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2785/500000]
+ train/ActionL1Loss=0.0495
+ throughput/total_tokens=534,720,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2786/500000]
+ train/ActionL1Loss=0.0481
+ throughput/total_tokens=534,912,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2787/500000]
+ train/ActionL1Loss=0.0541
+ throughput/total_tokens=535,104,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2788/500000]
+ train/ActionL1Loss=0.0605
+ throughput/total_tokens=535,296,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2789/500000]
+ train/ActionL1Loss=0.0708
+ throughput/total_tokens=535,488,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2790/500000]
+ train/ActionL1Loss=0.0696
+ throughput/total_tokens=535,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2791/500000]
+ train/ActionL1Loss=0.0642
+ throughput/total_tokens=535,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2792/500000]
+ train/ActionL1Loss=0.0555
+ throughput/total_tokens=536,064,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2793/500000]
+ train/ActionL1Loss=0.0617
+ throughput/total_tokens=536,256,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2794/500000]
+ train/ActionL1Loss=0.0662
+ throughput/total_tokens=536,448,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2795/500000]
+ train/ActionL1Loss=0.0715
+ throughput/total_tokens=536,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2796/500000]
+ train/ActionL1Loss=0.0569
+ throughput/total_tokens=536,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2797/500000]
+ train/ActionL1Loss=0.0632
+ throughput/total_tokens=537,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2798/500000]
+ train/ActionL1Loss=0.0499
+ throughput/total_tokens=537,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2799/500000]
+ train/ActionL1Loss=0.0671
+ throughput/total_tokens=537,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2800/500000]
+ optim/total_grad_norm=8.132
+ train/ActionL1Loss=0.0600
+ throughput/total_tokens=537,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2801/500000]
+ train/ActionL1Loss=0.0670
+ throughput/total_tokens=537,792,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2802/500000]
+ train/ActionL1Loss=0.0490
+ throughput/total_tokens=537,984,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2803/500000]
+ train/ActionL1Loss=0.0725
+ throughput/total_tokens=538,176,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2804/500000]
+ train/ActionL1Loss=0.0750
+ throughput/total_tokens=538,368,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2805/500000]
+ train/ActionL1Loss=0.0669
+ throughput/total_tokens=538,560,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2806/500000]
+ train/ActionL1Loss=0.0491
+ throughput/total_tokens=538,752,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2807/500000]
+ train/ActionL1Loss=0.0574
+ throughput/total_tokens=538,944,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2808/500000]
+ train/ActionL1Loss=0.0537
+ throughput/total_tokens=539,136,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2809/500000]
+ train/ActionL1Loss=0.0497
+ throughput/total_tokens=539,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2810/500000]
+ train/ActionL1Loss=0.0467
+ throughput/total_tokens=539,520,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2811/500000]
+ train/ActionL1Loss=0.0642
+ throughput/total_tokens=539,712,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2812/500000]
+ train/ActionL1Loss=0.0515
+ throughput/total_tokens=539,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2813/500000]
+ train/ActionL1Loss=0.0617
+ throughput/total_tokens=540,096,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2814/500000]
+ train/ActionL1Loss=0.0531
+ throughput/total_tokens=540,288,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2815/500000]
+ train/ActionL1Loss=0.0538
+ throughput/total_tokens=540,480,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2816/500000]
+ train/ActionL1Loss=0.0505
+ throughput/total_tokens=540,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2817/500000]
+ train/ActionL1Loss=0.0524
+ throughput/total_tokens=540,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2818/500000]
+ train/ActionL1Loss=0.0487
+ throughput/total_tokens=541,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2819/500000]
+ train/ActionL1Loss=0.0567
+ throughput/total_tokens=541,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2820/500000]
+ optim/total_grad_norm=6.953
+ train/ActionL1Loss=0.0591
+ throughput/total_tokens=541,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2821/500000]
+ train/ActionL1Loss=0.0656
+ throughput/total_tokens=541,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2822/500000]
+ train/ActionL1Loss=0.0664
+ throughput/total_tokens=541,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2823/500000]
+ train/ActionL1Loss=0.0561
+ throughput/total_tokens=542,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2824/500000]
+ train/ActionL1Loss=0.0623
+ throughput/total_tokens=542,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2825/500000]
+ train/ActionL1Loss=0.0535
+ throughput/total_tokens=542,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2826/500000]
+ train/ActionL1Loss=0.0622
+ throughput/total_tokens=542,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2827/500000]
+ train/ActionL1Loss=0.0591
+ throughput/total_tokens=542,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2828/500000]
+ train/ActionL1Loss=0.0549
+ throughput/total_tokens=542,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2829/500000]
+ train/ActionL1Loss=0.0539
+ throughput/total_tokens=543,168,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2830/500000]
+ train/ActionL1Loss=0.0554
+ throughput/total_tokens=543,360,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2831/500000]
+ train/ActionL1Loss=0.0519
+ throughput/total_tokens=543,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2832/500000]
+ train/ActionL1Loss=0.0584
+ throughput/total_tokens=543,744,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2833/500000]
+ train/ActionL1Loss=0.0569
+ throughput/total_tokens=543,936,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2834/500000]
+ train/ActionL1Loss=0.0538
+ throughput/total_tokens=544,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2835/500000]
+ train/ActionL1Loss=0.0528
+ throughput/total_tokens=544,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2836/500000]
+ train/ActionL1Loss=0.0564
+ throughput/total_tokens=544,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2837/500000]
+ train/ActionL1Loss=0.0499
+ throughput/total_tokens=544,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2838/500000]
+ train/ActionL1Loss=0.0460
+ throughput/total_tokens=544,896,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2839/500000]
+ train/ActionL1Loss=0.0541
+ throughput/total_tokens=545,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2840/500000]
+ optim/total_grad_norm=8.744
+ train/ActionL1Loss=0.0492
+ throughput/total_tokens=545,280,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2841/500000]
+ train/ActionL1Loss=0.0517
+ throughput/total_tokens=545,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2842/500000]
+ train/ActionL1Loss=0.0458
+ throughput/total_tokens=545,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2843/500000]
+ train/ActionL1Loss=0.0579
+ throughput/total_tokens=545,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2844/500000]
+ train/ActionL1Loss=0.0488
+ throughput/total_tokens=546,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2845/500000]
+ train/ActionL1Loss=0.0537
+ throughput/total_tokens=546,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2846/500000]
+ train/ActionL1Loss=0.0520
+ throughput/total_tokens=546,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2847/500000]
+ train/ActionL1Loss=0.0604
+ throughput/total_tokens=546,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2848/500000]
+ train/ActionL1Loss=0.0455
+ throughput/total_tokens=546,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2849/500000]
+ train/ActionL1Loss=0.0559
+ throughput/total_tokens=547,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2850/500000]
+ train/ActionL1Loss=0.0545
+ throughput/total_tokens=547,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2851/500000]
+ train/ActionL1Loss=0.0536
+ throughput/total_tokens=547,392,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2852/500000]
+ train/ActionL1Loss=0.0464
+ throughput/total_tokens=547,584,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2853/500000]
+ train/ActionL1Loss=0.0564
+ throughput/total_tokens=547,776,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2854/500000]
+ train/ActionL1Loss=0.0424
+ throughput/total_tokens=547,968,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2855/500000]
+ train/ActionL1Loss=0.0565
+ throughput/total_tokens=548,160,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2856/500000]
+ train/ActionL1Loss=0.0496
+ throughput/total_tokens=548,352,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2857/500000]
+ train/ActionL1Loss=0.0533
+ throughput/total_tokens=548,544,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2858/500000]
+ train/ActionL1Loss=0.0485
+ throughput/total_tokens=548,736,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2859/500000]
+ train/ActionL1Loss=0.0490
+ throughput/total_tokens=548,928,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2860/500000]
+ optim/total_grad_norm=9.119
+ train/ActionL1Loss=0.0483
+ throughput/total_tokens=549,120,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=2861/500000]
+ train/ActionL1Loss=0.0506
+ throughput/total_tokens=549,312,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2862/500000]
+ train/ActionL1Loss=0.0547
+ throughput/total_tokens=549,504,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2863/500000]
+ train/ActionL1Loss=0.0429
+ throughput/total_tokens=549,696,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2864/500000]
+ train/ActionL1Loss=0.0499
+ throughput/total_tokens=549,888,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2865/500000]
+ train/ActionL1Loss=0.0531
+ throughput/total_tokens=550,080,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2866/500000]
+ train/ActionL1Loss=0.0564
+ throughput/total_tokens=550,272,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2867/500000]
+ train/ActionL1Loss=0.0457
+ throughput/total_tokens=550,464,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2868/500000]
+ train/ActionL1Loss=0.0523
+ throughput/total_tokens=550,656,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2869/500000]
+ train/ActionL1Loss=0.0585
+ throughput/total_tokens=550,848,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2870/500000]
+ train/ActionL1Loss=0.0526
+ throughput/total_tokens=551,040,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2871/500000]
+ train/ActionL1Loss=0.0524
+ throughput/total_tokens=551,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2872/500000]
+ train/ActionL1Loss=0.0554
+ throughput/total_tokens=551,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2873/500000]
+ train/ActionL1Loss=0.0473
+ throughput/total_tokens=551,616,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2874/500000]
+ train/ActionL1Loss=0.0468
+ throughput/total_tokens=551,808,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2875/500000]
+ train/ActionL1Loss=0.0450
+ throughput/total_tokens=552,000,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2876/500000]
+ train/ActionL1Loss=0.0508
+ throughput/total_tokens=552,192,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2877/500000]
+ train/ActionL1Loss=0.0592
+ throughput/total_tokens=552,384,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2878/500000]
+ train/ActionL1Loss=0.0599
+ throughput/total_tokens=552,576,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2879/500000]
+ train/ActionL1Loss=0.0467
+ throughput/total_tokens=552,768,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2880/500000]
+ optim/total_grad_norm=9.264
+ train/ActionL1Loss=0.0542
+ throughput/total_tokens=552,960,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2881/500000]
+ train/ActionL1Loss=0.0517
+ throughput/total_tokens=553,152,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2882/500000]
+ train/ActionL1Loss=0.0621
+ throughput/total_tokens=553,344,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2883/500000]
+ train/ActionL1Loss=0.0714
+ throughput/total_tokens=553,536,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2884/500000]
+ train/ActionL1Loss=0.0444
+ throughput/total_tokens=553,728,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2885/500000]
+ train/ActionL1Loss=0.0604
+ throughput/total_tokens=553,920,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2886/500000]
+ train/ActionL1Loss=0.0686
+ throughput/total_tokens=554,112,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2887/500000]
+ train/ActionL1Loss=0.0575
+ throughput/total_tokens=554,304,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2888/500000]
+ train/ActionL1Loss=0.0429
+ throughput/total_tokens=554,496,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2889/500000]
+ train/ActionL1Loss=0.0612
+ throughput/total_tokens=554,688,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2890/500000]
+ train/ActionL1Loss=0.0506
+ throughput/total_tokens=554,880,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2891/500000]
+ train/ActionL1Loss=0.0558
+ throughput/total_tokens=555,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2892/500000]
+ train/ActionL1Loss=0.0393
+ throughput/total_tokens=555,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2893/500000]
+ train/ActionL1Loss=0.0624
+ throughput/total_tokens=555,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2894/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=555,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2895/500000]
+ train/ActionL1Loss=0.0525
+ throughput/total_tokens=555,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2896/500000]
+ train/ActionL1Loss=0.0635
+ throughput/total_tokens=556,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2897/500000]
+ train/ActionL1Loss=0.0440
+ throughput/total_tokens=556,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2898/500000]
+ train/ActionL1Loss=0.0441
+ throughput/total_tokens=556,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2899/500000]
+ train/ActionL1Loss=0.0510
+ throughput/total_tokens=556,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2900/500000]
+ optim/total_grad_norm=8.568
+ train/ActionL1Loss=0.0512
+ throughput/total_tokens=556,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2901/500000]
+ train/ActionL1Loss=0.0555
+ throughput/total_tokens=556,992,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2902/500000]
+ train/ActionL1Loss=0.0599
+ throughput/total_tokens=557,184,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2903/500000]
+ train/ActionL1Loss=0.0514
+ throughput/total_tokens=557,376,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2904/500000]
+ train/ActionL1Loss=0.0564
+ throughput/total_tokens=557,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2905/500000]
+ train/ActionL1Loss=0.0500
+ throughput/total_tokens=557,760,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2906/500000]
+ train/ActionL1Loss=0.0420
+ throughput/total_tokens=557,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2907/500000]
+ train/ActionL1Loss=0.0405
+ throughput/total_tokens=558,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2908/500000]
+ train/ActionL1Loss=0.0569
+ throughput/total_tokens=558,336,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2909/500000]
+ train/ActionL1Loss=0.0568
+ throughput/total_tokens=558,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2910/500000]
+ train/ActionL1Loss=0.0523
+ throughput/total_tokens=558,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2911/500000]
+ train/ActionL1Loss=0.0542
+ throughput/total_tokens=558,912,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2912/500000]
+ train/ActionL1Loss=0.0509
+ throughput/total_tokens=559,104,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2913/500000]
+ train/ActionL1Loss=0.0473
+ throughput/total_tokens=559,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2914/500000]
+ train/ActionL1Loss=0.0528
+ throughput/total_tokens=559,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=2915/500000]
+ train/ActionL1Loss=0.0498
+ throughput/total_tokens=559,680,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2916/500000]
+ train/ActionL1Loss=0.0479
+ throughput/total_tokens=559,872,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2917/500000]
+ train/ActionL1Loss=0.0668
+ throughput/total_tokens=560,064,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2918/500000]
+ train/ActionL1Loss=0.0480
+ throughput/total_tokens=560,256,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2919/500000]
+ train/ActionL1Loss=0.0573
+ throughput/total_tokens=560,448,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=2920/500000]
+ optim/total_grad_norm=9.205
+ train/ActionL1Loss=0.0396
+ throughput/total_tokens=560,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2921/500000]
+ train/ActionL1Loss=0.0606
+ throughput/total_tokens=560,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2922/500000]
+ train/ActionL1Loss=0.0443
+ throughput/total_tokens=561,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2923/500000]
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=561,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2924/500000]
+ train/ActionL1Loss=0.0538
+ throughput/total_tokens=561,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2925/500000]
+ train/ActionL1Loss=0.0594
+ throughput/total_tokens=561,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2926/500000]
+ train/ActionL1Loss=0.0457
+ throughput/total_tokens=561,792,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2927/500000]
+ train/ActionL1Loss=0.0657
+ throughput/total_tokens=561,984,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2928/500000]
+ train/ActionL1Loss=0.0449
+ throughput/total_tokens=562,176,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2929/500000]
+ train/ActionL1Loss=0.0474
+ throughput/total_tokens=562,368,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2930/500000]
+ train/ActionL1Loss=0.0490
+ throughput/total_tokens=562,560,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2931/500000]
+ train/ActionL1Loss=0.0528
+ throughput/total_tokens=562,752,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2932/500000]
+ train/ActionL1Loss=0.0648
+ throughput/total_tokens=562,944,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2933/500000]
+ train/ActionL1Loss=0.0551
+ throughput/total_tokens=563,136,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2934/500000]
+ train/ActionL1Loss=0.0635
+ throughput/total_tokens=563,328,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2935/500000]
+ train/ActionL1Loss=0.0606
+ throughput/total_tokens=563,520,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2936/500000]
+ train/ActionL1Loss=0.0646
+ throughput/total_tokens=563,712,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2937/500000]
+ train/ActionL1Loss=0.0531
+ throughput/total_tokens=563,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2938/500000]
+ train/ActionL1Loss=0.0577
+ throughput/total_tokens=564,096,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2939/500000]
+ train/ActionL1Loss=0.0518
+ throughput/total_tokens=564,288,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2940/500000]
+ optim/total_grad_norm=8.464
+ train/ActionL1Loss=0.0654
+ throughput/total_tokens=564,480,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2941/500000]
+ train/ActionL1Loss=0.0568
+ throughput/total_tokens=564,672,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2942/500000]
+ train/ActionL1Loss=0.0572
+ throughput/total_tokens=564,864,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2943/500000]
+ train/ActionL1Loss=0.0659
+ throughput/total_tokens=565,056,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=2944/500000]
+ train/ActionL1Loss=0.0682
+ throughput/total_tokens=565,248,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2945/500000]
+ train/ActionL1Loss=0.0619
+ throughput/total_tokens=565,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=2946/500000]
+ train/ActionL1Loss=0.0455
+ throughput/total_tokens=565,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2947/500000]
+ train/ActionL1Loss=0.0450
+ throughput/total_tokens=565,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2948/500000]
+ train/ActionL1Loss=0.0515
+ throughput/total_tokens=566,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2949/500000]
+ train/ActionL1Loss=0.0440
+ throughput/total_tokens=566,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2950/500000]
+ train/ActionL1Loss=0.0564
+ throughput/total_tokens=566,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2951/500000]
+ train/ActionL1Loss=0.0633
+ throughput/total_tokens=566,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2952/500000]
+ train/ActionL1Loss=0.0525
+ throughput/total_tokens=566,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2953/500000]
+ train/ActionL1Loss=0.0606
+ throughput/total_tokens=566,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2954/500000]
+ train/ActionL1Loss=0.0737
+ throughput/total_tokens=567,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2955/500000]
+ train/ActionL1Loss=0.0675
+ throughput/total_tokens=567,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2956/500000]
+ train/ActionL1Loss=0.0469
+ throughput/total_tokens=567,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2957/500000]
+ train/ActionL1Loss=0.0678
+ throughput/total_tokens=567,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2958/500000]
+ train/ActionL1Loss=0.0555
+ throughput/total_tokens=567,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2959/500000]
+ train/ActionL1Loss=0.0625
+ throughput/total_tokens=568,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2960/500000]
+ optim/total_grad_norm=9.554
+ train/ActionL1Loss=0.0512
+ throughput/total_tokens=568,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=2961/500000]
+ train/ActionL1Loss=0.0503
+ throughput/total_tokens=568,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2962/500000]
+ train/ActionL1Loss=0.0475
+ throughput/total_tokens=568,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=2963/500000]
+ train/ActionL1Loss=0.0576
+ throughput/total_tokens=568,896,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2964/500000]
+ train/ActionL1Loss=0.0516
+ throughput/total_tokens=569,088,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2965/500000]
+ train/ActionL1Loss=0.0461
+ throughput/total_tokens=569,280,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2966/500000]
+ train/ActionL1Loss=0.0561
+ throughput/total_tokens=569,472,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2967/500000]
+ train/ActionL1Loss=0.0405
+ throughput/total_tokens=569,664,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2968/500000]
+ train/ActionL1Loss=0.0466
+ throughput/total_tokens=569,856,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2969/500000]
+ train/ActionL1Loss=0.0454
+ throughput/total_tokens=570,048,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=2970/500000]
+ train/ActionL1Loss=0.0563
+ throughput/total_tokens=570,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2971/500000]
+ train/ActionL1Loss=0.0585
+ throughput/total_tokens=570,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2972/500000]
+ train/ActionL1Loss=0.0400
+ throughput/total_tokens=570,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2973/500000]
+ train/ActionL1Loss=0.0470
+ throughput/total_tokens=570,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2974/500000]
+ train/ActionL1Loss=0.0441
+ throughput/total_tokens=571,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2975/500000]
+ train/ActionL1Loss=0.0637
+ throughput/total_tokens=571,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2976/500000]
+ train/ActionL1Loss=0.0571
+ throughput/total_tokens=571,392,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2977/500000]
+ train/ActionL1Loss=0.0636
+ throughput/total_tokens=571,584,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2978/500000]
+ train/ActionL1Loss=0.0558
+ throughput/total_tokens=571,776,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2979/500000]
+ train/ActionL1Loss=0.0588
+ throughput/total_tokens=571,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2980/500000]
+ optim/total_grad_norm=8.233
+ train/ActionL1Loss=0.0642
+ throughput/total_tokens=572,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2981/500000]
+ train/ActionL1Loss=0.0575
+ throughput/total_tokens=572,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2982/500000]
+ train/ActionL1Loss=0.0615
+ throughput/total_tokens=572,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2983/500000]
+ train/ActionL1Loss=0.0592
+ throughput/total_tokens=572,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2984/500000]
+ train/ActionL1Loss=0.0530
+ throughput/total_tokens=572,928,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2985/500000]
+ train/ActionL1Loss=0.0573
+ throughput/total_tokens=573,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2986/500000]
+ train/ActionL1Loss=0.0550
+ throughput/total_tokens=573,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2987/500000]
+ train/ActionL1Loss=0.0578
+ throughput/total_tokens=573,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2988/500000]
+ train/ActionL1Loss=0.0591
+ throughput/total_tokens=573,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2989/500000]
+ train/ActionL1Loss=0.0529
+ throughput/total_tokens=573,888,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2990/500000]
+ train/ActionL1Loss=0.0489
+ throughput/total_tokens=574,080,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=2991/500000]
+ train/ActionL1Loss=0.0623
+ throughput/total_tokens=574,272,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2992/500000]
+ train/ActionL1Loss=0.0501
+ throughput/total_tokens=574,464,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=2993/500000]
+ train/ActionL1Loss=0.0516
+ throughput/total_tokens=574,656,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2994/500000]
+ train/ActionL1Loss=0.0750
+ throughput/total_tokens=574,848,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2995/500000]
+ train/ActionL1Loss=0.0593
+ throughput/total_tokens=575,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2996/500000]
+ train/ActionL1Loss=0.0627
+ throughput/total_tokens=575,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2997/500000]
+ train/ActionL1Loss=0.0496
+ throughput/total_tokens=575,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2998/500000]
+ train/ActionL1Loss=0.0471
+ throughput/total_tokens=575,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=2999/500000]
+ train/ActionL1Loss=0.0530
+ throughput/total_tokens=575,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3000/500000]
+ optim/total_grad_norm=8.636
+ train/ActionL1Loss=0.0538
+ throughput/total_tokens=576,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+10/03 [09:56:52] INFO | >> Saving config... checkpoint.py:608
+10/03 [09:57:34] INFO | >> Saving model state... checkpoint.py:796
+10/03 [09:58:44] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [10:00:08] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=3001/500000]
+ train/ActionL1Loss=0.0521
+ throughput/total_tokens=576,192,000
+ throughput/device/tokens_per_second=1,224
+ throughput/device/batches_per_second=0.0510
+[step=3002/500000]
+ train/ActionL1Loss=0.0520
+ throughput/total_tokens=576,384,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3003/500000]
+ train/ActionL1Loss=0.0626
+ throughput/total_tokens=576,576,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=3004/500000]
+ train/ActionL1Loss=0.0594
+ throughput/total_tokens=576,768,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=3005/500000]
+ train/ActionL1Loss=0.0592
+ throughput/total_tokens=576,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3006/500000]
+ train/ActionL1Loss=0.0516
+ throughput/total_tokens=577,152,000
+ throughput/device/tokens_per_second=1,159
+ throughput/device/batches_per_second=0.0483
+[step=3007/500000]
+ train/ActionL1Loss=0.0611
+ throughput/total_tokens=577,344,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=3008/500000]
+ train/ActionL1Loss=0.0557
+ throughput/total_tokens=577,536,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=3009/500000]
+ train/ActionL1Loss=0.0502
+ throughput/total_tokens=577,728,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=3010/500000]
+ train/ActionL1Loss=0.0436
+ throughput/total_tokens=577,920,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+ System/Peak GPU Memory (MB)=46,917
+[step=3011/500000]
+ train/ActionL1Loss=0.0456
+ throughput/total_tokens=578,112,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=3012/500000]
+ train/ActionL1Loss=0.0540
+ throughput/total_tokens=578,304,000
+ throughput/device/tokens_per_second=1,171
+ throughput/device/batches_per_second=0.0488
+[step=3013/500000]
+ train/ActionL1Loss=0.0517
+ throughput/total_tokens=578,496,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+[step=3014/500000]
+ train/ActionL1Loss=0.0552
+ throughput/total_tokens=578,688,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=3015/500000]
+ train/ActionL1Loss=0.0438
+ throughput/total_tokens=578,880,000
+ throughput/device/tokens_per_second=1,174
+ throughput/device/batches_per_second=0.0489
+[step=3016/500000]
+ train/ActionL1Loss=0.0420
+ throughput/total_tokens=579,072,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=3017/500000]
+ train/ActionL1Loss=0.0536
+ throughput/total_tokens=579,264,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=3018/500000]
+ train/ActionL1Loss=0.0481
+ throughput/total_tokens=579,456,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=3019/500000]
+ train/ActionL1Loss=0.0474
+ throughput/total_tokens=579,648,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0491
+[step=3020/500000]
+ optim/total_grad_norm=7.478
+ train/ActionL1Loss=0.0538
+ throughput/total_tokens=579,840,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0490
+ System/Peak GPU Memory (MB)=46,917
+[step=3021/500000]
+ train/ActionL1Loss=0.0604
+ throughput/total_tokens=580,032,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=3022/500000]
+ train/ActionL1Loss=0.0625
+ throughput/total_tokens=580,224,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=3023/500000]
+ train/ActionL1Loss=0.0510
+ throughput/total_tokens=580,416,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3024/500000]
+ train/ActionL1Loss=0.0444
+ throughput/total_tokens=580,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3025/500000]
+ train/ActionL1Loss=0.0541
+ throughput/total_tokens=580,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3026/500000]
+ train/ActionL1Loss=0.0573
+ throughput/total_tokens=580,992,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3027/500000]
+ train/ActionL1Loss=0.0488
+ throughput/total_tokens=581,184,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3028/500000]
+ train/ActionL1Loss=0.0472
+ throughput/total_tokens=581,376,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3029/500000]
+ train/ActionL1Loss=0.0494
+ throughput/total_tokens=581,568,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3030/500000]
+ train/ActionL1Loss=0.0497
+ throughput/total_tokens=581,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3031/500000]
+ train/ActionL1Loss=0.0431
+ throughput/total_tokens=581,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3032/500000]
+ train/ActionL1Loss=0.0571
+ throughput/total_tokens=582,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3033/500000]
+ train/ActionL1Loss=0.0512
+ throughput/total_tokens=582,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3034/500000]
+ train/ActionL1Loss=0.0451
+ throughput/total_tokens=582,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3035/500000]
+ train/ActionL1Loss=0.0517
+ throughput/total_tokens=582,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3036/500000]
+ train/ActionL1Loss=0.0624
+ throughput/total_tokens=582,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3037/500000]
+ train/ActionL1Loss=0.0553
+ throughput/total_tokens=583,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3038/500000]
+ train/ActionL1Loss=0.0546
+ throughput/total_tokens=583,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3039/500000]
+ train/ActionL1Loss=0.0569
+ throughput/total_tokens=583,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3040/500000]
+ optim/total_grad_norm=6.944
+ train/ActionL1Loss=0.0461
+ throughput/total_tokens=583,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3041/500000]
+ train/ActionL1Loss=0.0466
+ throughput/total_tokens=583,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3042/500000]
+ train/ActionL1Loss=0.0418
+ throughput/total_tokens=584,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3043/500000]
+ train/ActionL1Loss=0.0467
+ throughput/total_tokens=584,256,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3044/500000]
+ train/ActionL1Loss=0.0456
+ throughput/total_tokens=584,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3045/500000]
+ train/ActionL1Loss=0.0496
+ throughput/total_tokens=584,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3046/500000]
+ train/ActionL1Loss=0.0453
+ throughput/total_tokens=584,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3047/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=585,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3048/500000]
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=585,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3049/500000]
+ train/ActionL1Loss=0.0557
+ throughput/total_tokens=585,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3050/500000]
+ train/ActionL1Loss=0.0517
+ throughput/total_tokens=585,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3051/500000]
+ train/ActionL1Loss=0.0464
+ throughput/total_tokens=585,792,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3052/500000]
+ train/ActionL1Loss=0.0441
+ throughput/total_tokens=585,984,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3053/500000]
+ train/ActionL1Loss=0.0506
+ throughput/total_tokens=586,176,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3054/500000]
+ train/ActionL1Loss=0.0445
+ throughput/total_tokens=586,368,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3055/500000]
+ train/ActionL1Loss=0.0472
+ throughput/total_tokens=586,560,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3056/500000]
+ train/ActionL1Loss=0.0558
+ throughput/total_tokens=586,752,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3057/500000]
+ train/ActionL1Loss=0.0482
+ throughput/total_tokens=586,944,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3058/500000]
+ train/ActionL1Loss=0.0460
+ throughput/total_tokens=587,136,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3059/500000]
+ train/ActionL1Loss=0.0566
+ throughput/total_tokens=587,328,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3060/500000]
+ optim/total_grad_norm=8.008
+ train/ActionL1Loss=0.0518
+ throughput/total_tokens=587,520,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3061/500000]
+ train/ActionL1Loss=0.0652
+ throughput/total_tokens=587,712,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3062/500000]
+ train/ActionL1Loss=0.0460
+ throughput/total_tokens=587,904,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3063/500000]
+ train/ActionL1Loss=0.0546
+ throughput/total_tokens=588,096,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3064/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=588,288,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3065/500000]
+ train/ActionL1Loss=0.0625
+ throughput/total_tokens=588,480,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3066/500000]
+ train/ActionL1Loss=0.0683
+ throughput/total_tokens=588,672,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3067/500000]
+ train/ActionL1Loss=0.0642
+ throughput/total_tokens=588,864,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3068/500000]
+ train/ActionL1Loss=0.0769
+ throughput/total_tokens=589,056,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3069/500000]
+ train/ActionL1Loss=0.0600
+ throughput/total_tokens=589,248,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3070/500000]
+ train/ActionL1Loss=0.0618
+ throughput/total_tokens=589,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3071/500000]
+ train/ActionL1Loss=0.0562
+ throughput/total_tokens=589,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3072/500000]
+ train/ActionL1Loss=0.0583
+ throughput/total_tokens=589,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3073/500000]
+ train/ActionL1Loss=0.0431
+ throughput/total_tokens=590,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3074/500000]
+ train/ActionL1Loss=0.0549
+ throughput/total_tokens=590,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3075/500000]
+ train/ActionL1Loss=0.0427
+ throughput/total_tokens=590,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3076/500000]
+ train/ActionL1Loss=0.0429
+ throughput/total_tokens=590,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3077/500000]
+ train/ActionL1Loss=0.0524
+ throughput/total_tokens=590,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3078/500000]
+ train/ActionL1Loss=0.0481
+ throughput/total_tokens=590,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3079/500000]
+ train/ActionL1Loss=0.0470
+ throughput/total_tokens=591,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3080/500000]
+ optim/total_grad_norm=8.949
+ train/ActionL1Loss=0.0484
+ throughput/total_tokens=591,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3081/500000]
+ train/ActionL1Loss=0.0501
+ throughput/total_tokens=591,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3082/500000]
+ train/ActionL1Loss=0.0435
+ throughput/total_tokens=591,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3083/500000]
+ train/ActionL1Loss=0.0461
+ throughput/total_tokens=591,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3084/500000]
+ train/ActionL1Loss=0.0495
+ throughput/total_tokens=592,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3085/500000]
+ train/ActionL1Loss=0.0544
+ throughput/total_tokens=592,320,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3086/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=592,512,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3087/500000]
+ train/ActionL1Loss=0.0534
+ throughput/total_tokens=592,704,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3088/500000]
+ train/ActionL1Loss=0.0484
+ throughput/total_tokens=592,896,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3089/500000]
+ train/ActionL1Loss=0.0436
+ throughput/total_tokens=593,088,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3090/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=593,280,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3091/500000]
+ train/ActionL1Loss=0.0494
+ throughput/total_tokens=593,472,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3092/500000]
+ train/ActionL1Loss=0.0567
+ throughput/total_tokens=593,664,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3093/500000]
+ train/ActionL1Loss=0.0407
+ throughput/total_tokens=593,856,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3094/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=594,048,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3095/500000]
+ train/ActionL1Loss=0.0549
+ throughput/total_tokens=594,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3096/500000]
+ train/ActionL1Loss=0.0438
+ throughput/total_tokens=594,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3097/500000]
+ train/ActionL1Loss=0.0416
+ throughput/total_tokens=594,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3098/500000]
+ train/ActionL1Loss=0.0414
+ throughput/total_tokens=594,816,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=3099/500000]
+ train/ActionL1Loss=0.0413
+ throughput/total_tokens=595,008,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=3100/500000]
+ optim/total_grad_norm=9.288
+ train/ActionL1Loss=0.0441
+ throughput/total_tokens=595,200,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=3101/500000]
+ train/ActionL1Loss=0.0463
+ throughput/total_tokens=595,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3102/500000]
+ train/ActionL1Loss=0.0483
+ throughput/total_tokens=595,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3103/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=595,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3104/500000]
+ train/ActionL1Loss=0.0491
+ throughput/total_tokens=595,968,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3105/500000]
+ train/ActionL1Loss=0.0482
+ throughput/total_tokens=596,160,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3106/500000]
+ train/ActionL1Loss=0.0514
+ throughput/total_tokens=596,352,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3107/500000]
+ train/ActionL1Loss=0.0553
+ throughput/total_tokens=596,544,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3108/500000]
+ train/ActionL1Loss=0.0495
+ throughput/total_tokens=596,736,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3109/500000]
+ train/ActionL1Loss=0.0503
+ throughput/total_tokens=596,928,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3110/500000]
+ train/ActionL1Loss=0.0483
+ throughput/total_tokens=597,120,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3111/500000]
+ train/ActionL1Loss=0.0494
+ throughput/total_tokens=597,312,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3112/500000]
+ train/ActionL1Loss=0.0524
+ throughput/total_tokens=597,504,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3113/500000]
+ train/ActionL1Loss=0.0478
+ throughput/total_tokens=597,696,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3114/500000]
+ train/ActionL1Loss=0.0568
+ throughput/total_tokens=597,888,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3115/500000]
+ train/ActionL1Loss=0.0576
+ throughput/total_tokens=598,080,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3116/500000]
+ train/ActionL1Loss=0.0543
+ throughput/total_tokens=598,272,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3117/500000]
+ train/ActionL1Loss=0.0584
+ throughput/total_tokens=598,464,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3118/500000]
+ train/ActionL1Loss=0.0493
+ throughput/total_tokens=598,656,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3119/500000]
+ train/ActionL1Loss=0.0557
+ throughput/total_tokens=598,848,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3120/500000]
+ optim/total_grad_norm=7.200
+ train/ActionL1Loss=0.0532
+ throughput/total_tokens=599,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3121/500000]
+ train/ActionL1Loss=0.0429
+ throughput/total_tokens=599,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3122/500000]
+ train/ActionL1Loss=0.0495
+ throughput/total_tokens=599,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3123/500000]
+ train/ActionL1Loss=0.0557
+ throughput/total_tokens=599,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3124/500000]
+ train/ActionL1Loss=0.0579
+ throughput/total_tokens=599,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3125/500000]
+ train/ActionL1Loss=0.0492
+ throughput/total_tokens=600,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3126/500000]
+ train/ActionL1Loss=0.0484
+ throughput/total_tokens=600,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3127/500000]
+ train/ActionL1Loss=0.0509
+ throughput/total_tokens=600,384,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3128/500000]
+ train/ActionL1Loss=0.0550
+ throughput/total_tokens=600,576,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3129/500000]
+ train/ActionL1Loss=0.0450
+ throughput/total_tokens=600,768,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3130/500000]
+ train/ActionL1Loss=0.0661
+ throughput/total_tokens=600,960,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3131/500000]
+ train/ActionL1Loss=0.0463
+ throughput/total_tokens=601,152,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3132/500000]
+ train/ActionL1Loss=0.0438
+ throughput/total_tokens=601,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3133/500000]
+ train/ActionL1Loss=0.0527
+ throughput/total_tokens=601,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3134/500000]
+ train/ActionL1Loss=0.0381
+ throughput/total_tokens=601,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3135/500000]
+ train/ActionL1Loss=0.0378
+ throughput/total_tokens=601,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3136/500000]
+ train/ActionL1Loss=0.0465
+ throughput/total_tokens=602,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3137/500000]
+ train/ActionL1Loss=0.0412
+ throughput/total_tokens=602,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3138/500000]
+ train/ActionL1Loss=0.0472
+ throughput/total_tokens=602,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3139/500000]
+ train/ActionL1Loss=0.0498
+ throughput/total_tokens=602,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3140/500000]
+ optim/total_grad_norm=7.471
+ train/ActionL1Loss=0.0578
+ throughput/total_tokens=602,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3141/500000]
+ train/ActionL1Loss=0.0455
+ throughput/total_tokens=603,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3142/500000]
+ train/ActionL1Loss=0.0475
+ throughput/total_tokens=603,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3143/500000]
+ train/ActionL1Loss=0.0545
+ throughput/total_tokens=603,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3144/500000]
+ train/ActionL1Loss=0.0490
+ throughput/total_tokens=603,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3145/500000]
+ train/ActionL1Loss=0.0467
+ throughput/total_tokens=603,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3146/500000]
+ train/ActionL1Loss=0.0467
+ throughput/total_tokens=604,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3147/500000]
+ train/ActionL1Loss=0.0494
+ throughput/total_tokens=604,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3148/500000]
+ train/ActionL1Loss=0.0664
+ throughput/total_tokens=604,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3149/500000]
+ train/ActionL1Loss=0.0647
+ throughput/total_tokens=604,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3150/500000]
+ train/ActionL1Loss=0.0529
+ throughput/total_tokens=604,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3151/500000]
+ train/ActionL1Loss=0.0547
+ throughput/total_tokens=604,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3152/500000]
+ train/ActionL1Loss=0.0490
+ throughput/total_tokens=605,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3153/500000]
+ train/ActionL1Loss=0.0528
+ throughput/total_tokens=605,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3154/500000]
+ train/ActionL1Loss=0.0548
+ throughput/total_tokens=605,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3155/500000]
+ train/ActionL1Loss=0.0502
+ throughput/total_tokens=605,760,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3156/500000]
+ train/ActionL1Loss=0.0576
+ throughput/total_tokens=605,952,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3157/500000]
+ train/ActionL1Loss=0.0610
+ throughput/total_tokens=606,144,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3158/500000]
+ train/ActionL1Loss=0.0741
+ throughput/total_tokens=606,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3159/500000]
+ train/ActionL1Loss=0.0517
+ throughput/total_tokens=606,528,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3160/500000]
+ optim/total_grad_norm=7.145
+ train/ActionL1Loss=0.0502
+ throughput/total_tokens=606,720,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3161/500000]
+ train/ActionL1Loss=0.0453
+ throughput/total_tokens=606,912,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3162/500000]
+ train/ActionL1Loss=0.0590
+ throughput/total_tokens=607,104,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3163/500000]
+ train/ActionL1Loss=0.0454
+ throughput/total_tokens=607,296,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3164/500000]
+ train/ActionL1Loss=0.0549
+ throughput/total_tokens=607,488,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3165/500000]
+ train/ActionL1Loss=0.0556
+ throughput/total_tokens=607,680,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3166/500000]
+ train/ActionL1Loss=0.0532
+ throughput/total_tokens=607,872,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3167/500000]
+ train/ActionL1Loss=0.0580
+ throughput/total_tokens=608,064,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3168/500000]
+ train/ActionL1Loss=0.0490
+ throughput/total_tokens=608,256,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3169/500000]
+ train/ActionL1Loss=0.0699
+ throughput/total_tokens=608,448,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3170/500000]
+ train/ActionL1Loss=0.0456
+ throughput/total_tokens=608,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3171/500000]
+ train/ActionL1Loss=0.0542
+ throughput/total_tokens=608,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3172/500000]
+ train/ActionL1Loss=0.0557
+ throughput/total_tokens=609,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3173/500000]
+ train/ActionL1Loss=0.0533
+ throughput/total_tokens=609,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3174/500000]
+ train/ActionL1Loss=0.0512
+ throughput/total_tokens=609,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3175/500000]
+ train/ActionL1Loss=0.0521
+ throughput/total_tokens=609,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3176/500000]
+ train/ActionL1Loss=0.0423
+ throughput/total_tokens=609,792,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3177/500000]
+ train/ActionL1Loss=0.0458
+ throughput/total_tokens=609,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3178/500000]
+ train/ActionL1Loss=0.0466
+ throughput/total_tokens=610,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3179/500000]
+ train/ActionL1Loss=0.0490
+ throughput/total_tokens=610,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3180/500000]
+ optim/total_grad_norm=9.396
+ train/ActionL1Loss=0.0513
+ throughput/total_tokens=610,560,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3181/500000]
+ train/ActionL1Loss=0.0477
+ throughput/total_tokens=610,752,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3182/500000]
+ train/ActionL1Loss=0.0565
+ throughput/total_tokens=610,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3183/500000]
+ train/ActionL1Loss=0.0450
+ throughput/total_tokens=611,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3184/500000]
+ train/ActionL1Loss=0.0590
+ throughput/total_tokens=611,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3185/500000]
+ train/ActionL1Loss=0.0417
+ throughput/total_tokens=611,520,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3186/500000]
+ train/ActionL1Loss=0.0395
+ throughput/total_tokens=611,712,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3187/500000]
+ train/ActionL1Loss=0.0480
+ throughput/total_tokens=611,904,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3188/500000]
+ train/ActionL1Loss=0.0631
+ throughput/total_tokens=612,096,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3189/500000]
+ train/ActionL1Loss=0.0466
+ throughput/total_tokens=612,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3190/500000]
+ train/ActionL1Loss=0.0598
+ throughput/total_tokens=612,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3191/500000]
+ train/ActionL1Loss=0.0612
+ throughput/total_tokens=612,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3192/500000]
+ train/ActionL1Loss=0.0518
+ throughput/total_tokens=612,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3193/500000]
+ train/ActionL1Loss=0.0574
+ throughput/total_tokens=613,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3194/500000]
+ train/ActionL1Loss=0.0489
+ throughput/total_tokens=613,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3195/500000]
+ train/ActionL1Loss=0.0480
+ throughput/total_tokens=613,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3196/500000]
+ train/ActionL1Loss=0.0622
+ throughput/total_tokens=613,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3197/500000]
+ train/ActionL1Loss=0.0509
+ throughput/total_tokens=613,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3198/500000]
+ train/ActionL1Loss=0.0550
+ throughput/total_tokens=614,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3199/500000]
+ train/ActionL1Loss=0.0582
+ throughput/total_tokens=614,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3200/500000]
+ optim/total_grad_norm=10.80
+ train/ActionL1Loss=0.0678
+ throughput/total_tokens=614,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3201/500000]
+ train/ActionL1Loss=0.0501
+ throughput/total_tokens=614,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3202/500000]
+ train/ActionL1Loss=0.0406
+ throughput/total_tokens=614,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3203/500000]
+ train/ActionL1Loss=0.0554
+ throughput/total_tokens=614,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3204/500000]
+ train/ActionL1Loss=0.0675
+ throughput/total_tokens=615,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3205/500000]
+ train/ActionL1Loss=0.0567
+ throughput/total_tokens=615,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3206/500000]
+ train/ActionL1Loss=0.0469
+ throughput/total_tokens=615,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3207/500000]
+ train/ActionL1Loss=0.0674
+ throughput/total_tokens=615,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3208/500000]
+ train/ActionL1Loss=0.0450
+ throughput/total_tokens=615,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3209/500000]
+ train/ActionL1Loss=0.0543
+ throughput/total_tokens=616,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3210/500000]
+ train/ActionL1Loss=0.0609
+ throughput/total_tokens=616,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3211/500000]
+ train/ActionL1Loss=0.0469
+ throughput/total_tokens=616,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3212/500000]
+ train/ActionL1Loss=0.0477
+ throughput/total_tokens=616,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3213/500000]
+ train/ActionL1Loss=0.0543
+ throughput/total_tokens=616,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3214/500000]
+ train/ActionL1Loss=0.0428
+ throughput/total_tokens=617,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3215/500000]
+ train/ActionL1Loss=0.0548
+ throughput/total_tokens=617,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3216/500000]
+ train/ActionL1Loss=0.0559
+ throughput/total_tokens=617,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3217/500000]
+ train/ActionL1Loss=0.0521
+ throughput/total_tokens=617,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3218/500000]
+ train/ActionL1Loss=0.0554
+ throughput/total_tokens=617,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3219/500000]
+ train/ActionL1Loss=0.0438
+ throughput/total_tokens=618,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3220/500000]
+ optim/total_grad_norm=6.170
+ train/ActionL1Loss=0.0459
+ throughput/total_tokens=618,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3221/500000]
+ train/ActionL1Loss=0.0481
+ throughput/total_tokens=618,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3222/500000]
+ train/ActionL1Loss=0.0526
+ throughput/total_tokens=618,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3223/500000]
+ train/ActionL1Loss=0.0384
+ throughput/total_tokens=618,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3224/500000]
+ train/ActionL1Loss=0.0587
+ throughput/total_tokens=619,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3225/500000]
+ train/ActionL1Loss=0.0532
+ throughput/total_tokens=619,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3226/500000]
+ train/ActionL1Loss=0.0425
+ throughput/total_tokens=619,392,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3227/500000]
+ train/ActionL1Loss=0.0439
+ throughput/total_tokens=619,584,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3228/500000]
+ train/ActionL1Loss=0.0537
+ throughput/total_tokens=619,776,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3229/500000]
+ train/ActionL1Loss=0.0553
+ throughput/total_tokens=619,968,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3230/500000]
+ train/ActionL1Loss=0.0424
+ throughput/total_tokens=620,160,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3231/500000]
+ train/ActionL1Loss=0.0430
+ throughput/total_tokens=620,352,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3232/500000]
+ train/ActionL1Loss=0.0514
+ throughput/total_tokens=620,544,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3233/500000]
+ train/ActionL1Loss=0.0498
+ throughput/total_tokens=620,736,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3234/500000]
+ train/ActionL1Loss=0.0595
+ throughput/total_tokens=620,928,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3235/500000]
+ train/ActionL1Loss=0.0469
+ throughput/total_tokens=621,120,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3236/500000]
+ train/ActionL1Loss=0.0471
+ throughput/total_tokens=621,312,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3237/500000]
+ train/ActionL1Loss=0.0428
+ throughput/total_tokens=621,504,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3238/500000]
+ train/ActionL1Loss=0.0558
+ throughput/total_tokens=621,696,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3239/500000]
+ train/ActionL1Loss=0.0549
+ throughput/total_tokens=621,888,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3240/500000]
+ optim/total_grad_norm=7.371
+ train/ActionL1Loss=0.0654
+ throughput/total_tokens=622,080,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3241/500000]
+ train/ActionL1Loss=0.0604
+ throughput/total_tokens=622,272,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3242/500000]
+ train/ActionL1Loss=0.0494
+ throughput/total_tokens=622,464,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3243/500000]
+ train/ActionL1Loss=0.0383
+ throughput/total_tokens=622,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3244/500000]
+ train/ActionL1Loss=0.0510
+ throughput/total_tokens=622,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3245/500000]
+ train/ActionL1Loss=0.0600
+ throughput/total_tokens=623,040,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3246/500000]
+ train/ActionL1Loss=0.0440
+ throughput/total_tokens=623,232,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3247/500000]
+ train/ActionL1Loss=0.0451
+ throughput/total_tokens=623,424,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3248/500000]
+ train/ActionL1Loss=0.0386
+ throughput/total_tokens=623,616,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3249/500000]
+ train/ActionL1Loss=0.0486
+ throughput/total_tokens=623,808,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3250/500000]
+ train/ActionL1Loss=0.0522
+ throughput/total_tokens=624,000,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3251/500000]
+ train/ActionL1Loss=0.0483
+ throughput/total_tokens=624,192,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3252/500000]
+ train/ActionL1Loss=0.0482
+ throughput/total_tokens=624,384,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3253/500000]
+ train/ActionL1Loss=0.0513
+ throughput/total_tokens=624,576,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3254/500000]
+ train/ActionL1Loss=0.0511
+ throughput/total_tokens=624,768,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3255/500000]
+ train/ActionL1Loss=0.0729
+ throughput/total_tokens=624,960,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3256/500000]
+ train/ActionL1Loss=0.0539
+ throughput/total_tokens=625,152,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3257/500000]
+ train/ActionL1Loss=0.0504
+ throughput/total_tokens=625,344,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3258/500000]
+ train/ActionL1Loss=0.0545
+ throughput/total_tokens=625,536,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3259/500000]
+ train/ActionL1Loss=0.0554
+ throughput/total_tokens=625,728,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3260/500000]
+ optim/total_grad_norm=9.771
+ train/ActionL1Loss=0.0411
+ throughput/total_tokens=625,920,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3261/500000]
+ train/ActionL1Loss=0.0491
+ throughput/total_tokens=626,112,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3262/500000]
+ train/ActionL1Loss=0.0460
+ throughput/total_tokens=626,304,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3263/500000]
+ train/ActionL1Loss=0.0652
+ throughput/total_tokens=626,496,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3264/500000]
+ train/ActionL1Loss=0.0666
+ throughput/total_tokens=626,688,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3265/500000]
+ train/ActionL1Loss=0.0603
+ throughput/total_tokens=626,880,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3266/500000]
+ train/ActionL1Loss=0.0436
+ throughput/total_tokens=627,072,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3267/500000]
+ train/ActionL1Loss=0.0575
+ throughput/total_tokens=627,264,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3268/500000]
+ train/ActionL1Loss=0.0498
+ throughput/total_tokens=627,456,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3269/500000]
+ train/ActionL1Loss=0.0574
+ throughput/total_tokens=627,648,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3270/500000]
+ train/ActionL1Loss=0.0420
+ throughput/total_tokens=627,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3271/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=628,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3272/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=628,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3273/500000]
+ train/ActionL1Loss=0.0417
+ throughput/total_tokens=628,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3274/500000]
+ train/ActionL1Loss=0.0562
+ throughput/total_tokens=628,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3275/500000]
+ train/ActionL1Loss=0.0578
+ throughput/total_tokens=628,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3276/500000]
+ train/ActionL1Loss=0.0566
+ throughput/total_tokens=628,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3277/500000]
+ train/ActionL1Loss=0.0487
+ throughput/total_tokens=629,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3278/500000]
+ train/ActionL1Loss=0.0377
+ throughput/total_tokens=629,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3279/500000]
+ train/ActionL1Loss=0.0587
+ throughput/total_tokens=629,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3280/500000]
+ optim/total_grad_norm=9.158
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=629,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3281/500000]
+ train/ActionL1Loss=0.0483
+ throughput/total_tokens=629,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3282/500000]
+ train/ActionL1Loss=0.0399
+ throughput/total_tokens=630,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3283/500000]
+ train/ActionL1Loss=0.0477
+ throughput/total_tokens=630,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3284/500000]
+ train/ActionL1Loss=0.0454
+ throughput/total_tokens=630,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3285/500000]
+ train/ActionL1Loss=0.0615
+ throughput/total_tokens=630,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3286/500000]
+ train/ActionL1Loss=0.0379
+ throughput/total_tokens=630,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3287/500000]
+ train/ActionL1Loss=0.0417
+ throughput/total_tokens=631,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3288/500000]
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=631,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3289/500000]
+ train/ActionL1Loss=0.0535
+ throughput/total_tokens=631,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3290/500000]
+ train/ActionL1Loss=0.0595
+ throughput/total_tokens=631,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3291/500000]
+ train/ActionL1Loss=0.0527
+ throughput/total_tokens=631,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3292/500000]
+ train/ActionL1Loss=0.0420
+ throughput/total_tokens=632,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3293/500000]
+ train/ActionL1Loss=0.0425
+ throughput/total_tokens=632,256,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3294/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=632,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3295/500000]
+ train/ActionL1Loss=0.0398
+ throughput/total_tokens=632,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3296/500000]
+ train/ActionL1Loss=0.0473
+ throughput/total_tokens=632,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3297/500000]
+ train/ActionL1Loss=0.0459
+ throughput/total_tokens=633,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3298/500000]
+ train/ActionL1Loss=0.0439
+ throughput/total_tokens=633,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3299/500000]
+ train/ActionL1Loss=0.0611
+ throughput/total_tokens=633,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3300/500000]
+ optim/total_grad_norm=9.785
+ train/ActionL1Loss=0.0452
+ throughput/total_tokens=633,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3301/500000]
+ train/ActionL1Loss=0.0489
+ throughput/total_tokens=633,792,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3302/500000]
+ train/ActionL1Loss=0.0434
+ throughput/total_tokens=633,984,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3303/500000]
+ train/ActionL1Loss=0.0503
+ throughput/total_tokens=634,176,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3304/500000]
+ train/ActionL1Loss=0.0516
+ throughput/total_tokens=634,368,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3305/500000]
+ train/ActionL1Loss=0.0664
+ throughput/total_tokens=634,560,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3306/500000]
+ train/ActionL1Loss=0.0532
+ throughput/total_tokens=634,752,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3307/500000]
+ train/ActionL1Loss=0.0507
+ throughput/total_tokens=634,944,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3308/500000]
+ train/ActionL1Loss=0.0475
+ throughput/total_tokens=635,136,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3309/500000]
+ train/ActionL1Loss=0.0421
+ throughput/total_tokens=635,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3310/500000]
+ train/ActionL1Loss=0.0511
+ throughput/total_tokens=635,520,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3311/500000]
+ train/ActionL1Loss=0.0452
+ throughput/total_tokens=635,712,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3312/500000]
+ train/ActionL1Loss=0.0491
+ throughput/total_tokens=635,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3313/500000]
+ train/ActionL1Loss=0.0476
+ throughput/total_tokens=636,096,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3314/500000]
+ train/ActionL1Loss=0.0543
+ throughput/total_tokens=636,288,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3315/500000]
+ train/ActionL1Loss=0.0514
+ throughput/total_tokens=636,480,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3316/500000]
+ train/ActionL1Loss=0.0405
+ throughput/total_tokens=636,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3317/500000]
+ train/ActionL1Loss=0.0381
+ throughput/total_tokens=636,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3318/500000]
+ train/ActionL1Loss=0.0606
+ throughput/total_tokens=637,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3319/500000]
+ train/ActionL1Loss=0.0488
+ throughput/total_tokens=637,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3320/500000]
+ optim/total_grad_norm=8.032
+ train/ActionL1Loss=0.0512
+ throughput/total_tokens=637,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3321/500000]
+ train/ActionL1Loss=0.0468
+ throughput/total_tokens=637,632,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3322/500000]
+ train/ActionL1Loss=0.0441
+ throughput/total_tokens=637,824,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3323/500000]
+ train/ActionL1Loss=0.0486
+ throughput/total_tokens=638,016,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3324/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=638,208,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3325/500000]
+ train/ActionL1Loss=0.0544
+ throughput/total_tokens=638,400,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3326/500000]
+ train/ActionL1Loss=0.0423
+ throughput/total_tokens=638,592,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3327/500000]
+ train/ActionL1Loss=0.0595
+ throughput/total_tokens=638,784,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3328/500000]
+ train/ActionL1Loss=0.0519
+ throughput/total_tokens=638,976,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3329/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=639,168,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3330/500000]
+ train/ActionL1Loss=0.0448
+ throughput/total_tokens=639,360,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3331/500000]
+ train/ActionL1Loss=0.0535
+ throughput/total_tokens=639,552,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3332/500000]
+ train/ActionL1Loss=0.0462
+ throughput/total_tokens=639,744,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3333/500000]
+ train/ActionL1Loss=0.0503
+ throughput/total_tokens=639,936,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3334/500000]
+ train/ActionL1Loss=0.0629
+ throughput/total_tokens=640,128,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3335/500000]
+ train/ActionL1Loss=0.0538
+ throughput/total_tokens=640,320,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3336/500000]
+ train/ActionL1Loss=0.0553
+ throughput/total_tokens=640,512,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3337/500000]
+ train/ActionL1Loss=0.0506
+ throughput/total_tokens=640,704,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3338/500000]
+ train/ActionL1Loss=0.0449
+ throughput/total_tokens=640,896,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3339/500000]
+ train/ActionL1Loss=0.0511
+ throughput/total_tokens=641,088,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3340/500000]
+ optim/total_grad_norm=9.981
+ train/ActionL1Loss=0.0497
+ throughput/total_tokens=641,280,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3341/500000]
+ train/ActionL1Loss=0.0459
+ throughput/total_tokens=641,472,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3342/500000]
+ train/ActionL1Loss=0.0422
+ throughput/total_tokens=641,664,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3343/500000]
+ train/ActionL1Loss=0.0581
+ throughput/total_tokens=641,856,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3344/500000]
+ train/ActionL1Loss=0.0455
+ throughput/total_tokens=642,048,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3345/500000]
+ train/ActionL1Loss=0.0378
+ throughput/total_tokens=642,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3346/500000]
+ train/ActionL1Loss=0.0464
+ throughput/total_tokens=642,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3347/500000]
+ train/ActionL1Loss=0.0481
+ throughput/total_tokens=642,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3348/500000]
+ train/ActionL1Loss=0.0475
+ throughput/total_tokens=642,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3349/500000]
+ train/ActionL1Loss=0.0463
+ throughput/total_tokens=643,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3350/500000]
+ train/ActionL1Loss=0.0501
+ throughput/total_tokens=643,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3351/500000]
+ train/ActionL1Loss=0.0531
+ throughput/total_tokens=643,392,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3352/500000]
+ train/ActionL1Loss=0.0630
+ throughput/total_tokens=643,584,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3353/500000]
+ train/ActionL1Loss=0.0480
+ throughput/total_tokens=643,776,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3354/500000]
+ train/ActionL1Loss=0.0498
+ throughput/total_tokens=643,968,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3355/500000]
+ train/ActionL1Loss=0.0466
+ throughput/total_tokens=644,160,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3356/500000]
+ train/ActionL1Loss=0.0429
+ throughput/total_tokens=644,352,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3357/500000]
+ train/ActionL1Loss=0.0451
+ throughput/total_tokens=644,544,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3358/500000]
+ train/ActionL1Loss=0.0417
+ throughput/total_tokens=644,736,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3359/500000]
+ train/ActionL1Loss=0.0501
+ throughput/total_tokens=644,928,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3360/500000]
+ optim/total_grad_norm=9.305
+ train/ActionL1Loss=0.0438
+ throughput/total_tokens=645,120,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3361/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=645,312,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3362/500000]
+ train/ActionL1Loss=0.0529
+ throughput/total_tokens=645,504,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3363/500000]
+ train/ActionL1Loss=0.0469
+ throughput/total_tokens=645,696,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3364/500000]
+ train/ActionL1Loss=0.0418
+ throughput/total_tokens=645,888,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3365/500000]
+ train/ActionL1Loss=0.0481
+ throughput/total_tokens=646,080,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3366/500000]
+ train/ActionL1Loss=0.0602
+ throughput/total_tokens=646,272,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3367/500000]
+ train/ActionL1Loss=0.0430
+ throughput/total_tokens=646,464,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3368/500000]
+ train/ActionL1Loss=0.0423
+ throughput/total_tokens=646,656,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3369/500000]
+ train/ActionL1Loss=0.0534
+ throughput/total_tokens=646,848,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3370/500000]
+ train/ActionL1Loss=0.0657
+ throughput/total_tokens=647,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3371/500000]
+ train/ActionL1Loss=0.0516
+ throughput/total_tokens=647,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3372/500000]
+ train/ActionL1Loss=0.0518
+ throughput/total_tokens=647,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3373/500000]
+ train/ActionL1Loss=0.0582
+ throughput/total_tokens=647,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3374/500000]
+ train/ActionL1Loss=0.0553
+ throughput/total_tokens=647,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3375/500000]
+ train/ActionL1Loss=0.0511
+ throughput/total_tokens=648,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3376/500000]
+ train/ActionL1Loss=0.0423
+ throughput/total_tokens=648,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3377/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=648,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3378/500000]
+ train/ActionL1Loss=0.0402
+ throughput/total_tokens=648,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3379/500000]
+ train/ActionL1Loss=0.0421
+ throughput/total_tokens=648,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3380/500000]
+ optim/total_grad_norm=10.61
+ train/ActionL1Loss=0.0534
+ throughput/total_tokens=648,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3381/500000]
+ train/ActionL1Loss=0.0558
+ throughput/total_tokens=649,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3382/500000]
+ train/ActionL1Loss=0.0510
+ throughput/total_tokens=649,344,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3383/500000]
+ train/ActionL1Loss=0.0416
+ throughput/total_tokens=649,536,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3384/500000]
+ train/ActionL1Loss=0.0464
+ throughput/total_tokens=649,728,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3385/500000]
+ train/ActionL1Loss=0.0592
+ throughput/total_tokens=649,920,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=3386/500000]
+ train/ActionL1Loss=0.0515
+ throughput/total_tokens=650,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3387/500000]
+ train/ActionL1Loss=0.0501
+ throughput/total_tokens=650,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3388/500000]
+ train/ActionL1Loss=0.0467
+ throughput/total_tokens=650,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3389/500000]
+ train/ActionL1Loss=0.0421
+ throughput/total_tokens=650,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3390/500000]
+ train/ActionL1Loss=0.0528
+ throughput/total_tokens=650,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3391/500000]
+ train/ActionL1Loss=0.0395
+ throughput/total_tokens=651,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3392/500000]
+ train/ActionL1Loss=0.0472
+ throughput/total_tokens=651,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3393/500000]
+ train/ActionL1Loss=0.0409
+ throughput/total_tokens=651,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3394/500000]
+ train/ActionL1Loss=0.0458
+ throughput/total_tokens=651,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3395/500000]
+ train/ActionL1Loss=0.0486
+ throughput/total_tokens=651,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3396/500000]
+ train/ActionL1Loss=0.0356
+ throughput/total_tokens=652,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3397/500000]
+ train/ActionL1Loss=0.0426
+ throughput/total_tokens=652,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3398/500000]
+ train/ActionL1Loss=0.0541
+ throughput/total_tokens=652,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3399/500000]
+ train/ActionL1Loss=0.0609
+ throughput/total_tokens=652,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3400/500000]
+ optim/total_grad_norm=8.471
+ train/ActionL1Loss=0.0388
+ throughput/total_tokens=652,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3401/500000]
+ train/ActionL1Loss=0.0457
+ throughput/total_tokens=652,992,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3402/500000]
+ train/ActionL1Loss=0.0563
+ throughput/total_tokens=653,184,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3403/500000]
+ train/ActionL1Loss=0.0448
+ throughput/total_tokens=653,376,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3404/500000]
+ train/ActionL1Loss=0.0431
+ throughput/total_tokens=653,568,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3405/500000]
+ train/ActionL1Loss=0.0475
+ throughput/total_tokens=653,760,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3406/500000]
+ train/ActionL1Loss=0.0391
+ throughput/total_tokens=653,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3407/500000]
+ train/ActionL1Loss=0.0438
+ throughput/total_tokens=654,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3408/500000]
+ train/ActionL1Loss=0.0472
+ throughput/total_tokens=654,336,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3409/500000]
+ train/ActionL1Loss=0.0508
+ throughput/total_tokens=654,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3410/500000]
+ train/ActionL1Loss=0.0521
+ throughput/total_tokens=654,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3411/500000]
+ train/ActionL1Loss=0.0466
+ throughput/total_tokens=654,912,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3412/500000]
+ train/ActionL1Loss=0.0464
+ throughput/total_tokens=655,104,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3413/500000]
+ train/ActionL1Loss=0.0550
+ throughput/total_tokens=655,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3414/500000]
+ train/ActionL1Loss=0.0473
+ throughput/total_tokens=655,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3415/500000]
+ train/ActionL1Loss=0.0439
+ throughput/total_tokens=655,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3416/500000]
+ train/ActionL1Loss=0.0490
+ throughput/total_tokens=655,872,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3417/500000]
+ train/ActionL1Loss=0.0458
+ throughput/total_tokens=656,064,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3418/500000]
+ train/ActionL1Loss=0.0449
+ throughput/total_tokens=656,256,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3419/500000]
+ train/ActionL1Loss=0.0515
+ throughput/total_tokens=656,448,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3420/500000]
+ optim/total_grad_norm=8.846
+ train/ActionL1Loss=0.0430
+ throughput/total_tokens=656,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3421/500000]
+ train/ActionL1Loss=0.0471
+ throughput/total_tokens=656,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3422/500000]
+ train/ActionL1Loss=0.0481
+ throughput/total_tokens=657,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3423/500000]
+ train/ActionL1Loss=0.0502
+ throughput/total_tokens=657,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3424/500000]
+ train/ActionL1Loss=0.0525
+ throughput/total_tokens=657,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3425/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=657,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3426/500000]
+ train/ActionL1Loss=0.0429
+ throughput/total_tokens=657,792,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3427/500000]
+ train/ActionL1Loss=0.0467
+ throughput/total_tokens=657,984,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3428/500000]
+ train/ActionL1Loss=0.0499
+ throughput/total_tokens=658,176,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3429/500000]
+ train/ActionL1Loss=0.0457
+ throughput/total_tokens=658,368,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3430/500000]
+ train/ActionL1Loss=0.0472
+ throughput/total_tokens=658,560,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3431/500000]
+ train/ActionL1Loss=0.0445
+ throughput/total_tokens=658,752,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3432/500000]
+ train/ActionL1Loss=0.0532
+ throughput/total_tokens=658,944,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3433/500000]
+ train/ActionL1Loss=0.0478
+ throughput/total_tokens=659,136,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3434/500000]
+ train/ActionL1Loss=0.0535
+ throughput/total_tokens=659,328,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3435/500000]
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=659,520,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3436/500000]
+ train/ActionL1Loss=0.0502
+ throughput/total_tokens=659,712,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3437/500000]
+ train/ActionL1Loss=0.0494
+ throughput/total_tokens=659,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3438/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=660,096,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3439/500000]
+ train/ActionL1Loss=0.0541
+ throughput/total_tokens=660,288,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3440/500000]
+ optim/total_grad_norm=10.11
+ train/ActionL1Loss=0.0519
+ throughput/total_tokens=660,480,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3441/500000]
+ train/ActionL1Loss=0.0559
+ throughput/total_tokens=660,672,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3442/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=660,864,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3443/500000]
+ train/ActionL1Loss=0.0454
+ throughput/total_tokens=661,056,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3444/500000]
+ train/ActionL1Loss=0.0607
+ throughput/total_tokens=661,248,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3445/500000]
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=661,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3446/500000]
+ train/ActionL1Loss=0.0489
+ throughput/total_tokens=661,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3447/500000]
+ train/ActionL1Loss=0.0394
+ throughput/total_tokens=661,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3448/500000]
+ train/ActionL1Loss=0.0522
+ throughput/total_tokens=662,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3449/500000]
+ train/ActionL1Loss=0.0456
+ throughput/total_tokens=662,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3450/500000]
+ train/ActionL1Loss=0.0464
+ throughput/total_tokens=662,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3451/500000]
+ train/ActionL1Loss=0.0636
+ throughput/total_tokens=662,592,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3452/500000]
+ train/ActionL1Loss=0.0498
+ throughput/total_tokens=662,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3453/500000]
+ train/ActionL1Loss=0.0496
+ throughput/total_tokens=662,976,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3454/500000]
+ train/ActionL1Loss=0.0699
+ throughput/total_tokens=663,168,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3455/500000]
+ train/ActionL1Loss=0.0535
+ throughput/total_tokens=663,360,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3456/500000]
+ train/ActionL1Loss=0.0529
+ throughput/total_tokens=663,552,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3457/500000]
+ train/ActionL1Loss=0.0496
+ throughput/total_tokens=663,744,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3458/500000]
+ train/ActionL1Loss=0.0430
+ throughput/total_tokens=663,936,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3459/500000]
+ train/ActionL1Loss=0.0445
+ throughput/total_tokens=664,128,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3460/500000]
+ optim/total_grad_norm=9.761
+ train/ActionL1Loss=0.0442
+ throughput/total_tokens=664,320,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3461/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=664,512,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3462/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=664,704,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3463/500000]
+ train/ActionL1Loss=0.0492
+ throughput/total_tokens=664,896,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3464/500000]
+ train/ActionL1Loss=0.0559
+ throughput/total_tokens=665,088,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3465/500000]
+ train/ActionL1Loss=0.0407
+ throughput/total_tokens=665,280,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3466/500000]
+ train/ActionL1Loss=0.0457
+ throughput/total_tokens=665,472,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3467/500000]
+ train/ActionL1Loss=0.0446
+ throughput/total_tokens=665,664,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3468/500000]
+ train/ActionL1Loss=0.0499
+ throughput/total_tokens=665,856,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3469/500000]
+ train/ActionL1Loss=0.0474
+ throughput/total_tokens=666,048,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3470/500000]
+ train/ActionL1Loss=0.0425
+ throughput/total_tokens=666,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3471/500000]
+ train/ActionL1Loss=0.0391
+ throughput/total_tokens=666,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3472/500000]
+ train/ActionL1Loss=0.0482
+ throughput/total_tokens=666,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3473/500000]
+ train/ActionL1Loss=0.0472
+ throughput/total_tokens=666,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3474/500000]
+ train/ActionL1Loss=0.0394
+ throughput/total_tokens=667,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3475/500000]
+ train/ActionL1Loss=0.0378
+ throughput/total_tokens=667,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3476/500000]
+ train/ActionL1Loss=0.0521
+ throughput/total_tokens=667,392,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3477/500000]
+ train/ActionL1Loss=0.0493
+ throughput/total_tokens=667,584,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3478/500000]
+ train/ActionL1Loss=0.0453
+ throughput/total_tokens=667,776,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3479/500000]
+ train/ActionL1Loss=0.0560
+ throughput/total_tokens=667,968,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3480/500000]
+ optim/total_grad_norm=8.542
+ train/ActionL1Loss=0.0535
+ throughput/total_tokens=668,160,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3481/500000]
+ train/ActionL1Loss=0.0540
+ throughput/total_tokens=668,352,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3482/500000]
+ train/ActionL1Loss=0.0501
+ throughput/total_tokens=668,544,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3483/500000]
+ train/ActionL1Loss=0.0623
+ throughput/total_tokens=668,736,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3484/500000]
+ train/ActionL1Loss=0.0615
+ throughput/total_tokens=668,928,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3485/500000]
+ train/ActionL1Loss=0.0453
+ throughput/total_tokens=669,120,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3486/500000]
+ train/ActionL1Loss=0.0463
+ throughput/total_tokens=669,312,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3487/500000]
+ train/ActionL1Loss=0.0579
+ throughput/total_tokens=669,504,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3488/500000]
+ train/ActionL1Loss=0.0516
+ throughput/total_tokens=669,696,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3489/500000]
+ train/ActionL1Loss=0.0436
+ throughput/total_tokens=669,888,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3490/500000]
+ train/ActionL1Loss=0.0453
+ throughput/total_tokens=670,080,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3491/500000]
+ train/ActionL1Loss=0.0594
+ throughput/total_tokens=670,272,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3492/500000]
+ train/ActionL1Loss=0.0512
+ throughput/total_tokens=670,464,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3493/500000]
+ train/ActionL1Loss=0.0611
+ throughput/total_tokens=670,656,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3494/500000]
+ train/ActionL1Loss=0.0430
+ throughput/total_tokens=670,848,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3495/500000]
+ train/ActionL1Loss=0.0477
+ throughput/total_tokens=671,040,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3496/500000]
+ train/ActionL1Loss=0.0493
+ throughput/total_tokens=671,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3497/500000]
+ train/ActionL1Loss=0.0401
+ throughput/total_tokens=671,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3498/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=671,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3499/500000]
+ train/ActionL1Loss=0.0483
+ throughput/total_tokens=671,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3500/500000]
+ optim/total_grad_norm=7.923
+ train/ActionL1Loss=0.0503
+ throughput/total_tokens=672,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+10/03 [12:50:14] INFO | >> Saving config... checkpoint.py:608
+10/03 [12:51:06] INFO | >> Saving model state... checkpoint.py:796
+10/03 [12:52:17] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [12:53:46] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=3501/500000]
+ train/ActionL1Loss=0.0533
+ throughput/total_tokens=672,192,000
+ throughput/device/tokens_per_second=1,215
+ throughput/device/batches_per_second=0.0506
+[step=3502/500000]
+ train/ActionL1Loss=0.0480
+ throughput/total_tokens=672,384,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=3503/500000]
+ train/ActionL1Loss=0.0526
+ throughput/total_tokens=672,576,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=3504/500000]
+ train/ActionL1Loss=0.0465
+ throughput/total_tokens=672,768,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=3505/500000]
+ train/ActionL1Loss=0.0508
+ throughput/total_tokens=672,960,000
+ throughput/device/tokens_per_second=1,171
+ throughput/device/batches_per_second=0.0488
+[step=3506/500000]
+ train/ActionL1Loss=0.0479
+ throughput/total_tokens=673,152,000
+ throughput/device/tokens_per_second=1,174
+ throughput/device/batches_per_second=0.0489
+[step=3507/500000]
+ train/ActionL1Loss=0.0509
+ throughput/total_tokens=673,344,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=3508/500000]
+ train/ActionL1Loss=0.0539
+ throughput/total_tokens=673,536,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0491
+[step=3509/500000]
+ train/ActionL1Loss=0.0534
+ throughput/total_tokens=673,728,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=3510/500000]
+ train/ActionL1Loss=0.0529
+ throughput/total_tokens=673,920,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+ System/Peak GPU Memory (MB)=46,917
+[step=3511/500000]
+ train/ActionL1Loss=0.0533
+ throughput/total_tokens=674,112,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=3512/500000]
+ train/ActionL1Loss=0.0486
+ throughput/total_tokens=674,304,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=3513/500000]
+ train/ActionL1Loss=0.0511
+ throughput/total_tokens=674,496,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=3514/500000]
+ train/ActionL1Loss=0.0596
+ throughput/total_tokens=674,688,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=3515/500000]
+ train/ActionL1Loss=0.0749
+ throughput/total_tokens=674,880,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=3516/500000]
+ train/ActionL1Loss=0.0511
+ throughput/total_tokens=675,072,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3517/500000]
+ train/ActionL1Loss=0.0494
+ throughput/total_tokens=675,264,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3518/500000]
+ train/ActionL1Loss=0.0506
+ throughput/total_tokens=675,456,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3519/500000]
+ train/ActionL1Loss=0.0543
+ throughput/total_tokens=675,648,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3520/500000]
+ optim/total_grad_norm=7.662
+ train/ActionL1Loss=0.0541
+ throughput/total_tokens=675,840,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3521/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=676,032,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3522/500000]
+ train/ActionL1Loss=0.0509
+ throughput/total_tokens=676,224,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3523/500000]
+ train/ActionL1Loss=0.0460
+ throughput/total_tokens=676,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3524/500000]
+ train/ActionL1Loss=0.0496
+ throughput/total_tokens=676,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3525/500000]
+ train/ActionL1Loss=0.0369
+ throughput/total_tokens=676,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3526/500000]
+ train/ActionL1Loss=0.0507
+ throughput/total_tokens=676,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3527/500000]
+ train/ActionL1Loss=0.0538
+ throughput/total_tokens=677,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3528/500000]
+ train/ActionL1Loss=0.0405
+ throughput/total_tokens=677,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3529/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=677,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3530/500000]
+ train/ActionL1Loss=0.0511
+ throughput/total_tokens=677,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3531/500000]
+ train/ActionL1Loss=0.0503
+ throughput/total_tokens=677,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3532/500000]
+ train/ActionL1Loss=0.0439
+ throughput/total_tokens=678,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3533/500000]
+ train/ActionL1Loss=0.0535
+ throughput/total_tokens=678,336,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3534/500000]
+ train/ActionL1Loss=0.0471
+ throughput/total_tokens=678,528,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3535/500000]
+ train/ActionL1Loss=0.0480
+ throughput/total_tokens=678,720,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3536/500000]
+ train/ActionL1Loss=0.0479
+ throughput/total_tokens=678,912,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3537/500000]
+ train/ActionL1Loss=0.0532
+ throughput/total_tokens=679,104,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3538/500000]
+ train/ActionL1Loss=0.0512
+ throughput/total_tokens=679,296,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3539/500000]
+ train/ActionL1Loss=0.0552
+ throughput/total_tokens=679,488,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3540/500000]
+ optim/total_grad_norm=7.349
+ train/ActionL1Loss=0.0480
+ throughput/total_tokens=679,680,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3541/500000]
+ train/ActionL1Loss=0.0552
+ throughput/total_tokens=679,872,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3542/500000]
+ train/ActionL1Loss=0.0472
+ throughput/total_tokens=680,064,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3543/500000]
+ train/ActionL1Loss=0.0575
+ throughput/total_tokens=680,256,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3544/500000]
+ train/ActionL1Loss=0.0371
+ throughput/total_tokens=680,448,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3545/500000]
+ train/ActionL1Loss=0.0538
+ throughput/total_tokens=680,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3546/500000]
+ train/ActionL1Loss=0.0399
+ throughput/total_tokens=680,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3547/500000]
+ train/ActionL1Loss=0.0485
+ throughput/total_tokens=681,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3548/500000]
+ train/ActionL1Loss=0.0419
+ throughput/total_tokens=681,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3549/500000]
+ train/ActionL1Loss=0.0433
+ throughput/total_tokens=681,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3550/500000]
+ train/ActionL1Loss=0.0542
+ throughput/total_tokens=681,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3551/500000]
+ train/ActionL1Loss=0.0439
+ throughput/total_tokens=681,792,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3552/500000]
+ train/ActionL1Loss=0.0412
+ throughput/total_tokens=681,984,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3553/500000]
+ train/ActionL1Loss=0.0440
+ throughput/total_tokens=682,176,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3554/500000]
+ train/ActionL1Loss=0.0531
+ throughput/total_tokens=682,368,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3555/500000]
+ train/ActionL1Loss=0.0429
+ throughput/total_tokens=682,560,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3556/500000]
+ train/ActionL1Loss=0.0483
+ throughput/total_tokens=682,752,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3557/500000]
+ train/ActionL1Loss=0.0549
+ throughput/total_tokens=682,944,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3558/500000]
+ train/ActionL1Loss=0.0457
+ throughput/total_tokens=683,136,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3559/500000]
+ train/ActionL1Loss=0.0457
+ throughput/total_tokens=683,328,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3560/500000]
+ optim/total_grad_norm=9.439
+ train/ActionL1Loss=0.0491
+ throughput/total_tokens=683,520,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3561/500000]
+ train/ActionL1Loss=0.0383
+ throughput/total_tokens=683,712,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3562/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=683,904,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3563/500000]
+ train/ActionL1Loss=0.0495
+ throughput/total_tokens=684,096,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3564/500000]
+ train/ActionL1Loss=0.0474
+ throughput/total_tokens=684,288,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3565/500000]
+ train/ActionL1Loss=0.0511
+ throughput/total_tokens=684,480,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3566/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=684,672,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3567/500000]
+ train/ActionL1Loss=0.0566
+ throughput/total_tokens=684,864,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3568/500000]
+ train/ActionL1Loss=0.0475
+ throughput/total_tokens=685,056,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3569/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=685,248,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3570/500000]
+ train/ActionL1Loss=0.0440
+ throughput/total_tokens=685,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3571/500000]
+ train/ActionL1Loss=0.0434
+ throughput/total_tokens=685,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3572/500000]
+ train/ActionL1Loss=0.0432
+ throughput/total_tokens=685,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3573/500000]
+ train/ActionL1Loss=0.0512
+ throughput/total_tokens=686,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3574/500000]
+ train/ActionL1Loss=0.0404
+ throughput/total_tokens=686,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3575/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=686,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3576/500000]
+ train/ActionL1Loss=0.0434
+ throughput/total_tokens=686,592,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3577/500000]
+ train/ActionL1Loss=0.0370
+ throughput/total_tokens=686,784,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3578/500000]
+ train/ActionL1Loss=0.0493
+ throughput/total_tokens=686,976,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3579/500000]
+ train/ActionL1Loss=0.0512
+ throughput/total_tokens=687,168,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3580/500000]
+ optim/total_grad_norm=7.748
+ train/ActionL1Loss=0.0419
+ throughput/total_tokens=687,360,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3581/500000]
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=687,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3582/500000]
+ train/ActionL1Loss=0.0416
+ throughput/total_tokens=687,744,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3583/500000]
+ train/ActionL1Loss=0.0481
+ throughput/total_tokens=687,936,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3584/500000]
+ train/ActionL1Loss=0.0505
+ throughput/total_tokens=688,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3585/500000]
+ train/ActionL1Loss=0.0463
+ throughput/total_tokens=688,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3586/500000]
+ train/ActionL1Loss=0.0451
+ throughput/total_tokens=688,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3587/500000]
+ train/ActionL1Loss=0.0409
+ throughput/total_tokens=688,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3588/500000]
+ train/ActionL1Loss=0.0427
+ throughput/total_tokens=688,896,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3589/500000]
+ train/ActionL1Loss=0.0451
+ throughput/total_tokens=689,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3590/500000]
+ train/ActionL1Loss=0.0445
+ throughput/total_tokens=689,280,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3591/500000]
+ train/ActionL1Loss=0.0385
+ throughput/total_tokens=689,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3592/500000]
+ train/ActionL1Loss=0.0420
+ throughput/total_tokens=689,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3593/500000]
+ train/ActionL1Loss=0.0424
+ throughput/total_tokens=689,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3594/500000]
+ train/ActionL1Loss=0.0370
+ throughput/total_tokens=690,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3595/500000]
+ train/ActionL1Loss=0.0411
+ throughput/total_tokens=690,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3596/500000]
+ train/ActionL1Loss=0.0596
+ throughput/total_tokens=690,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3597/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=690,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3598/500000]
+ train/ActionL1Loss=0.0501
+ throughput/total_tokens=690,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3599/500000]
+ train/ActionL1Loss=0.0435
+ throughput/total_tokens=691,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3600/500000]
+ optim/total_grad_norm=8.740
+ train/ActionL1Loss=0.0406
+ throughput/total_tokens=691,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3601/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=691,392,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3602/500000]
+ train/ActionL1Loss=0.0371
+ throughput/total_tokens=691,584,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3603/500000]
+ train/ActionL1Loss=0.0457
+ throughput/total_tokens=691,776,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3604/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=691,968,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3605/500000]
+ train/ActionL1Loss=0.0547
+ throughput/total_tokens=692,160,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3606/500000]
+ train/ActionL1Loss=0.0411
+ throughput/total_tokens=692,352,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3607/500000]
+ train/ActionL1Loss=0.0550
+ throughput/total_tokens=692,544,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3608/500000]
+ train/ActionL1Loss=0.0395
+ throughput/total_tokens=692,736,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3609/500000]
+ train/ActionL1Loss=0.0399
+ throughput/total_tokens=692,928,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3610/500000]
+ train/ActionL1Loss=0.0483
+ throughput/total_tokens=693,120,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3611/500000]
+ train/ActionL1Loss=0.0564
+ throughput/total_tokens=693,312,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3612/500000]
+ train/ActionL1Loss=0.0563
+ throughput/total_tokens=693,504,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3613/500000]
+ train/ActionL1Loss=0.0405
+ throughput/total_tokens=693,696,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3614/500000]
+ train/ActionL1Loss=0.0519
+ throughput/total_tokens=693,888,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3615/500000]
+ train/ActionL1Loss=0.0795
+ throughput/total_tokens=694,080,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3616/500000]
+ train/ActionL1Loss=0.0500
+ throughput/total_tokens=694,272,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3617/500000]
+ train/ActionL1Loss=0.0400
+ throughput/total_tokens=694,464,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3618/500000]
+ train/ActionL1Loss=0.0459
+ throughput/total_tokens=694,656,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3619/500000]
+ train/ActionL1Loss=0.0493
+ throughput/total_tokens=694,848,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3620/500000]
+ optim/total_grad_norm=9.555
+ train/ActionL1Loss=0.0522
+ throughput/total_tokens=695,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3621/500000]
+ train/ActionL1Loss=0.0494
+ throughput/total_tokens=695,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3622/500000]
+ train/ActionL1Loss=0.0477
+ throughput/total_tokens=695,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3623/500000]
+ train/ActionL1Loss=0.0470
+ throughput/total_tokens=695,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3624/500000]
+ train/ActionL1Loss=0.0530
+ throughput/total_tokens=695,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3625/500000]
+ train/ActionL1Loss=0.0657
+ throughput/total_tokens=696,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3626/500000]
+ train/ActionL1Loss=0.0499
+ throughput/total_tokens=696,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3627/500000]
+ train/ActionL1Loss=0.0445
+ throughput/total_tokens=696,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3628/500000]
+ train/ActionL1Loss=0.0426
+ throughput/total_tokens=696,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3629/500000]
+ train/ActionL1Loss=0.0465
+ throughput/total_tokens=696,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3630/500000]
+ train/ActionL1Loss=0.0441
+ throughput/total_tokens=696,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3631/500000]
+ train/ActionL1Loss=0.0514
+ throughput/total_tokens=697,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3632/500000]
+ train/ActionL1Loss=0.0503
+ throughput/total_tokens=697,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3633/500000]
+ train/ActionL1Loss=0.0423
+ throughput/total_tokens=697,536,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3634/500000]
+ train/ActionL1Loss=0.0464
+ throughput/total_tokens=697,728,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3635/500000]
+ train/ActionL1Loss=0.0491
+ throughput/total_tokens=697,920,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3636/500000]
+ train/ActionL1Loss=0.0438
+ throughput/total_tokens=698,112,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3637/500000]
+ train/ActionL1Loss=0.0548
+ throughput/total_tokens=698,304,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3638/500000]
+ train/ActionL1Loss=0.0519
+ throughput/total_tokens=698,496,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3639/500000]
+ train/ActionL1Loss=0.0498
+ throughput/total_tokens=698,688,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3640/500000]
+ optim/total_grad_norm=10.44
+ train/ActionL1Loss=0.0428
+ throughput/total_tokens=698,880,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3641/500000]
+ train/ActionL1Loss=0.0456
+ throughput/total_tokens=699,072,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3642/500000]
+ train/ActionL1Loss=0.0423
+ throughput/total_tokens=699,264,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3643/500000]
+ train/ActionL1Loss=0.0556
+ throughput/total_tokens=699,456,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3644/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=699,648,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3645/500000]
+ train/ActionL1Loss=0.0511
+ throughput/total_tokens=699,840,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3646/500000]
+ train/ActionL1Loss=0.0377
+ throughput/total_tokens=700,032,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3647/500000]
+ train/ActionL1Loss=0.0410
+ throughput/total_tokens=700,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3648/500000]
+ train/ActionL1Loss=0.0427
+ throughput/total_tokens=700,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3649/500000]
+ train/ActionL1Loss=0.0384
+ throughput/total_tokens=700,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3650/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=700,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3651/500000]
+ train/ActionL1Loss=0.0555
+ throughput/total_tokens=700,992,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3652/500000]
+ train/ActionL1Loss=0.0454
+ throughput/total_tokens=701,184,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3653/500000]
+ train/ActionL1Loss=0.0457
+ throughput/total_tokens=701,376,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3654/500000]
+ train/ActionL1Loss=0.0461
+ throughput/total_tokens=701,568,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3655/500000]
+ train/ActionL1Loss=0.0365
+ throughput/total_tokens=701,760,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3656/500000]
+ train/ActionL1Loss=0.0402
+ throughput/total_tokens=701,952,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3657/500000]
+ train/ActionL1Loss=0.0450
+ throughput/total_tokens=702,144,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3658/500000]
+ train/ActionL1Loss=0.0402
+ throughput/total_tokens=702,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3659/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=702,528,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3660/500000]
+ optim/total_grad_norm=9.078
+ train/ActionL1Loss=0.0372
+ throughput/total_tokens=702,720,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3661/500000]
+ train/ActionL1Loss=0.0469
+ throughput/total_tokens=702,912,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3662/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=703,104,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3663/500000]
+ train/ActionL1Loss=0.0449
+ throughput/total_tokens=703,296,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3664/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=703,488,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3665/500000]
+ train/ActionL1Loss=0.0407
+ throughput/total_tokens=703,680,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3666/500000]
+ train/ActionL1Loss=0.0463
+ throughput/total_tokens=703,872,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3667/500000]
+ train/ActionL1Loss=0.0395
+ throughput/total_tokens=704,064,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3668/500000]
+ train/ActionL1Loss=0.0448
+ throughput/total_tokens=704,256,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3669/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=704,448,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3670/500000]
+ train/ActionL1Loss=0.0469
+ throughput/total_tokens=704,640,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3671/500000]
+ train/ActionL1Loss=0.0485
+ throughput/total_tokens=704,832,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3672/500000]
+ train/ActionL1Loss=0.0416
+ throughput/total_tokens=705,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3673/500000]
+ train/ActionL1Loss=0.0450
+ throughput/total_tokens=705,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3674/500000]
+ train/ActionL1Loss=0.0464
+ throughput/total_tokens=705,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3675/500000]
+ train/ActionL1Loss=0.0482
+ throughput/total_tokens=705,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3676/500000]
+ train/ActionL1Loss=0.0442
+ throughput/total_tokens=705,792,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3677/500000]
+ train/ActionL1Loss=0.0374
+ throughput/total_tokens=705,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3678/500000]
+ train/ActionL1Loss=0.0419
+ throughput/total_tokens=706,176,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3679/500000]
+ train/ActionL1Loss=0.0508
+ throughput/total_tokens=706,368,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3680/500000]
+ optim/total_grad_norm=9.951
+ train/ActionL1Loss=0.0441
+ throughput/total_tokens=706,560,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3681/500000]
+ train/ActionL1Loss=0.0406
+ throughput/total_tokens=706,752,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3682/500000]
+ train/ActionL1Loss=0.0405
+ throughput/total_tokens=706,944,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3683/500000]
+ train/ActionL1Loss=0.0531
+ throughput/total_tokens=707,136,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3684/500000]
+ train/ActionL1Loss=0.0552
+ throughput/total_tokens=707,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3685/500000]
+ train/ActionL1Loss=0.0433
+ throughput/total_tokens=707,520,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3686/500000]
+ train/ActionL1Loss=0.0462
+ throughput/total_tokens=707,712,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3687/500000]
+ train/ActionL1Loss=0.0409
+ throughput/total_tokens=707,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3688/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=708,096,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3689/500000]
+ train/ActionL1Loss=0.0452
+ throughput/total_tokens=708,288,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3690/500000]
+ train/ActionL1Loss=0.0526
+ throughput/total_tokens=708,480,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3691/500000]
+ train/ActionL1Loss=0.0418
+ throughput/total_tokens=708,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3692/500000]
+ train/ActionL1Loss=0.0604
+ throughput/total_tokens=708,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3693/500000]
+ train/ActionL1Loss=0.0496
+ throughput/total_tokens=709,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3694/500000]
+ train/ActionL1Loss=0.0513
+ throughput/total_tokens=709,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3695/500000]
+ train/ActionL1Loss=0.0489
+ throughput/total_tokens=709,440,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3696/500000]
+ train/ActionL1Loss=0.0443
+ throughput/total_tokens=709,632,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3697/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=709,824,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3698/500000]
+ train/ActionL1Loss=0.0416
+ throughput/total_tokens=710,016,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3699/500000]
+ train/ActionL1Loss=0.0449
+ throughput/total_tokens=710,208,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3700/500000]
+ optim/total_grad_norm=8.280
+ train/ActionL1Loss=0.0461
+ throughput/total_tokens=710,400,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3701/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=710,592,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3702/500000]
+ train/ActionL1Loss=0.0450
+ throughput/total_tokens=710,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3703/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=710,976,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3704/500000]
+ train/ActionL1Loss=0.0422
+ throughput/total_tokens=711,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3705/500000]
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=711,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3706/500000]
+ train/ActionL1Loss=0.0434
+ throughput/total_tokens=711,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3707/500000]
+ train/ActionL1Loss=0.0419
+ throughput/total_tokens=711,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3708/500000]
+ train/ActionL1Loss=0.0453
+ throughput/total_tokens=711,936,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3709/500000]
+ train/ActionL1Loss=0.0500
+ throughput/total_tokens=712,128,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3710/500000]
+ train/ActionL1Loss=0.0406
+ throughput/total_tokens=712,320,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3711/500000]
+ train/ActionL1Loss=0.0492
+ throughput/total_tokens=712,512,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3712/500000]
+ train/ActionL1Loss=0.0416
+ throughput/total_tokens=712,704,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3713/500000]
+ train/ActionL1Loss=0.0471
+ throughput/total_tokens=712,896,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3714/500000]
+ train/ActionL1Loss=0.0356
+ throughput/total_tokens=713,088,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3715/500000]
+ train/ActionL1Loss=0.0406
+ throughput/total_tokens=713,280,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3716/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=713,472,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3717/500000]
+ train/ActionL1Loss=0.0365
+ throughput/total_tokens=713,664,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3718/500000]
+ train/ActionL1Loss=0.0501
+ throughput/total_tokens=713,856,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3719/500000]
+ train/ActionL1Loss=0.0473
+ throughput/total_tokens=714,048,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3720/500000]
+ optim/total_grad_norm=9.227
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=714,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3721/500000]
+ train/ActionL1Loss=0.0421
+ throughput/total_tokens=714,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3722/500000]
+ train/ActionL1Loss=0.0369
+ throughput/total_tokens=714,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3723/500000]
+ train/ActionL1Loss=0.0392
+ throughput/total_tokens=714,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3724/500000]
+ train/ActionL1Loss=0.0467
+ throughput/total_tokens=715,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3725/500000]
+ train/ActionL1Loss=0.0443
+ throughput/total_tokens=715,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3726/500000]
+ train/ActionL1Loss=0.0457
+ throughput/total_tokens=715,392,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3727/500000]
+ train/ActionL1Loss=0.0440
+ throughput/total_tokens=715,584,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3728/500000]
+ train/ActionL1Loss=0.0434
+ throughput/total_tokens=715,776,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3729/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=715,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3730/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=716,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3731/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=716,352,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3732/500000]
+ train/ActionL1Loss=0.0488
+ throughput/total_tokens=716,544,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3733/500000]
+ train/ActionL1Loss=0.0423
+ throughput/total_tokens=716,736,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3734/500000]
+ train/ActionL1Loss=0.0438
+ throughput/total_tokens=716,928,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3735/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=717,120,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3736/500000]
+ train/ActionL1Loss=0.0449
+ throughput/total_tokens=717,312,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3737/500000]
+ train/ActionL1Loss=0.0418
+ throughput/total_tokens=717,504,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3738/500000]
+ train/ActionL1Loss=0.0476
+ throughput/total_tokens=717,696,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3739/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=717,888,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3740/500000]
+ optim/total_grad_norm=9.749
+ train/ActionL1Loss=0.0386
+ throughput/total_tokens=718,080,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3741/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=718,272,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3742/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=718,464,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3743/500000]
+ train/ActionL1Loss=0.0522
+ throughput/total_tokens=718,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3744/500000]
+ train/ActionL1Loss=0.0445
+ throughput/total_tokens=718,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3745/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=719,040,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3746/500000]
+ train/ActionL1Loss=0.0379
+ throughput/total_tokens=719,232,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3747/500000]
+ train/ActionL1Loss=0.0406
+ throughput/total_tokens=719,424,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3748/500000]
+ train/ActionL1Loss=0.0402
+ throughput/total_tokens=719,616,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3749/500000]
+ train/ActionL1Loss=0.0434
+ throughput/total_tokens=719,808,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3750/500000]
+ train/ActionL1Loss=0.0607
+ throughput/total_tokens=720,000,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3751/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=720,192,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3752/500000]
+ train/ActionL1Loss=0.0411
+ throughput/total_tokens=720,384,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3753/500000]
+ train/ActionL1Loss=0.0449
+ throughput/total_tokens=720,576,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3754/500000]
+ train/ActionL1Loss=0.0377
+ throughput/total_tokens=720,768,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3755/500000]
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=720,960,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3756/500000]
+ train/ActionL1Loss=0.0426
+ throughput/total_tokens=721,152,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3757/500000]
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=721,344,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3758/500000]
+ train/ActionL1Loss=0.0387
+ throughput/total_tokens=721,536,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3759/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=721,728,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3760/500000]
+ optim/total_grad_norm=8.763
+ train/ActionL1Loss=0.0425
+ throughput/total_tokens=721,920,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3761/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=722,112,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3762/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=722,304,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3763/500000]
+ train/ActionL1Loss=0.0420
+ throughput/total_tokens=722,496,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3764/500000]
+ train/ActionL1Loss=0.0477
+ throughput/total_tokens=722,688,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3765/500000]
+ train/ActionL1Loss=0.0508
+ throughput/total_tokens=722,880,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3766/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=723,072,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3767/500000]
+ train/ActionL1Loss=0.0476
+ throughput/total_tokens=723,264,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3768/500000]
+ train/ActionL1Loss=0.0410
+ throughput/total_tokens=723,456,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3769/500000]
+ train/ActionL1Loss=0.0419
+ throughput/total_tokens=723,648,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3770/500000]
+ train/ActionL1Loss=0.0406
+ throughput/total_tokens=723,840,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3771/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=724,032,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3772/500000]
+ train/ActionL1Loss=0.0501
+ throughput/total_tokens=724,224,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3773/500000]
+ train/ActionL1Loss=0.0443
+ throughput/total_tokens=724,416,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3774/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=724,608,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3775/500000]
+ train/ActionL1Loss=0.0442
+ throughput/total_tokens=724,800,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3776/500000]
+ train/ActionL1Loss=0.0421
+ throughput/total_tokens=724,992,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3777/500000]
+ train/ActionL1Loss=0.0503
+ throughput/total_tokens=725,184,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3778/500000]
+ train/ActionL1Loss=0.0490
+ throughput/total_tokens=725,376,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3779/500000]
+ train/ActionL1Loss=0.0475
+ throughput/total_tokens=725,568,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3780/500000]
+ optim/total_grad_norm=8.965
+ train/ActionL1Loss=0.0433
+ throughput/total_tokens=725,760,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3781/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=725,952,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3782/500000]
+ train/ActionL1Loss=0.0423
+ throughput/total_tokens=726,144,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3783/500000]
+ train/ActionL1Loss=0.0411
+ throughput/total_tokens=726,336,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3784/500000]
+ train/ActionL1Loss=0.0401
+ throughput/total_tokens=726,528,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3785/500000]
+ train/ActionL1Loss=0.0450
+ throughput/total_tokens=726,720,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3786/500000]
+ train/ActionL1Loss=0.0392
+ throughput/total_tokens=726,912,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3787/500000]
+ train/ActionL1Loss=0.0396
+ throughput/total_tokens=727,104,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3788/500000]
+ train/ActionL1Loss=0.0359
+ throughput/total_tokens=727,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3789/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=727,488,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3790/500000]
+ train/ActionL1Loss=0.0394
+ throughput/total_tokens=727,680,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3791/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=727,872,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3792/500000]
+ train/ActionL1Loss=0.0379
+ throughput/total_tokens=728,064,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3793/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=728,256,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3794/500000]
+ train/ActionL1Loss=0.0395
+ throughput/total_tokens=728,448,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3795/500000]
+ train/ActionL1Loss=0.0398
+ throughput/total_tokens=728,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3796/500000]
+ train/ActionL1Loss=0.0400
+ throughput/total_tokens=728,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3797/500000]
+ train/ActionL1Loss=0.0492
+ throughput/total_tokens=729,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3798/500000]
+ train/ActionL1Loss=0.0442
+ throughput/total_tokens=729,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3799/500000]
+ train/ActionL1Loss=0.0418
+ throughput/total_tokens=729,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3800/500000]
+ optim/total_grad_norm=8.842
+ train/ActionL1Loss=0.0449
+ throughput/total_tokens=729,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3801/500000]
+ train/ActionL1Loss=0.0396
+ throughput/total_tokens=729,792,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3802/500000]
+ train/ActionL1Loss=0.0462
+ throughput/total_tokens=729,984,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3803/500000]
+ train/ActionL1Loss=0.0460
+ throughput/total_tokens=730,176,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3804/500000]
+ train/ActionL1Loss=0.0474
+ throughput/total_tokens=730,368,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3805/500000]
+ train/ActionL1Loss=0.0366
+ throughput/total_tokens=730,560,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3806/500000]
+ train/ActionL1Loss=0.0459
+ throughput/total_tokens=730,752,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3807/500000]
+ train/ActionL1Loss=0.0465
+ throughput/total_tokens=730,944,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3808/500000]
+ train/ActionL1Loss=0.0385
+ throughput/total_tokens=731,136,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3809/500000]
+ train/ActionL1Loss=0.0379
+ throughput/total_tokens=731,328,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3810/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=731,520,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3811/500000]
+ train/ActionL1Loss=0.0429
+ throughput/total_tokens=731,712,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3812/500000]
+ train/ActionL1Loss=0.0425
+ throughput/total_tokens=731,904,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3813/500000]
+ train/ActionL1Loss=0.0423
+ throughput/total_tokens=732,096,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3814/500000]
+ train/ActionL1Loss=0.0458
+ throughput/total_tokens=732,288,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3815/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=732,480,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3816/500000]
+ train/ActionL1Loss=0.0388
+ throughput/total_tokens=732,672,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3817/500000]
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=732,864,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3818/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=733,056,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3819/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=733,248,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3820/500000]
+ optim/total_grad_norm=8.724
+ train/ActionL1Loss=0.0441
+ throughput/total_tokens=733,440,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3821/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=733,632,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3822/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=733,824,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3823/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=734,016,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3824/500000]
+ train/ActionL1Loss=0.0381
+ throughput/total_tokens=734,208,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3825/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=734,400,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3826/500000]
+ train/ActionL1Loss=0.0391
+ throughput/total_tokens=734,592,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3827/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=734,784,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3828/500000]
+ train/ActionL1Loss=0.0402
+ throughput/total_tokens=734,976,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3829/500000]
+ train/ActionL1Loss=0.0428
+ throughput/total_tokens=735,168,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3830/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=735,360,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3831/500000]
+ train/ActionL1Loss=0.0395
+ throughput/total_tokens=735,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3832/500000]
+ train/ActionL1Loss=0.0462
+ throughput/total_tokens=735,744,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3833/500000]
+ train/ActionL1Loss=0.0394
+ throughput/total_tokens=735,936,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3834/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=736,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3835/500000]
+ train/ActionL1Loss=0.0374
+ throughput/total_tokens=736,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3836/500000]
+ train/ActionL1Loss=0.0420
+ throughput/total_tokens=736,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3837/500000]
+ train/ActionL1Loss=0.0412
+ throughput/total_tokens=736,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3838/500000]
+ train/ActionL1Loss=0.0431
+ throughput/total_tokens=736,896,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3839/500000]
+ train/ActionL1Loss=0.0442
+ throughput/total_tokens=737,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3840/500000]
+ optim/total_grad_norm=7.293
+ train/ActionL1Loss=0.0398
+ throughput/total_tokens=737,280,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3841/500000]
+ train/ActionL1Loss=0.0448
+ throughput/total_tokens=737,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3842/500000]
+ train/ActionL1Loss=0.0483
+ throughput/total_tokens=737,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3843/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=737,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3844/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=738,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3845/500000]
+ train/ActionL1Loss=0.0494
+ throughput/total_tokens=738,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=3846/500000]
+ train/ActionL1Loss=0.0474
+ throughput/total_tokens=738,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3847/500000]
+ train/ActionL1Loss=0.0399
+ throughput/total_tokens=738,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3848/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=738,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3849/500000]
+ train/ActionL1Loss=0.0354
+ throughput/total_tokens=739,008,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3850/500000]
+ train/ActionL1Loss=0.0440
+ throughput/total_tokens=739,200,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3851/500000]
+ train/ActionL1Loss=0.0484
+ throughput/total_tokens=739,392,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3852/500000]
+ train/ActionL1Loss=0.0442
+ throughput/total_tokens=739,584,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3853/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=739,776,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3854/500000]
+ train/ActionL1Loss=0.0409
+ throughput/total_tokens=739,968,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3855/500000]
+ train/ActionL1Loss=0.0479
+ throughput/total_tokens=740,160,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3856/500000]
+ train/ActionL1Loss=0.0409
+ throughput/total_tokens=740,352,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3857/500000]
+ train/ActionL1Loss=0.0424
+ throughput/total_tokens=740,544,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3858/500000]
+ train/ActionL1Loss=0.0416
+ throughput/total_tokens=740,736,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3859/500000]
+ train/ActionL1Loss=0.0387
+ throughput/total_tokens=740,928,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3860/500000]
+ optim/total_grad_norm=9.162
+ train/ActionL1Loss=0.0471
+ throughput/total_tokens=741,120,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3861/500000]
+ train/ActionL1Loss=0.0439
+ throughput/total_tokens=741,312,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3862/500000]
+ train/ActionL1Loss=0.0490
+ throughput/total_tokens=741,504,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=3863/500000]
+ train/ActionL1Loss=0.0391
+ throughput/total_tokens=741,696,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=3864/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=741,888,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=3865/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=742,080,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=3866/500000]
+ train/ActionL1Loss=0.0439
+ throughput/total_tokens=742,272,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=3867/500000]
+ train/ActionL1Loss=0.0544
+ throughput/total_tokens=742,464,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=3868/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=742,656,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=3869/500000]
+ train/ActionL1Loss=0.0516
+ throughput/total_tokens=742,848,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=3870/500000]
+ train/ActionL1Loss=0.0413
+ throughput/total_tokens=743,040,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3871/500000]
+ train/ActionL1Loss=0.0444
+ throughput/total_tokens=743,232,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3872/500000]
+ train/ActionL1Loss=0.0647
+ throughput/total_tokens=743,424,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3873/500000]
+ train/ActionL1Loss=0.0368
+ throughput/total_tokens=743,616,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3874/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=743,808,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3875/500000]
+ train/ActionL1Loss=0.0407
+ throughput/total_tokens=744,000,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3876/500000]
+ train/ActionL1Loss=0.0464
+ throughput/total_tokens=744,192,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3877/500000]
+ train/ActionL1Loss=0.0414
+ throughput/total_tokens=744,384,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3878/500000]
+ train/ActionL1Loss=0.0401
+ throughput/total_tokens=744,576,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3879/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=744,768,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3880/500000]
+ optim/total_grad_norm=8.511
+ train/ActionL1Loss=0.0474
+ throughput/total_tokens=744,960,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3881/500000]
+ train/ActionL1Loss=0.0383
+ throughput/total_tokens=745,152,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3882/500000]
+ train/ActionL1Loss=0.0400
+ throughput/total_tokens=745,344,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=3883/500000]
+ train/ActionL1Loss=0.0438
+ throughput/total_tokens=745,536,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=3884/500000]
+ train/ActionL1Loss=0.0440
+ throughput/total_tokens=745,728,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3885/500000]
+ train/ActionL1Loss=0.0466
+ throughput/total_tokens=745,920,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3886/500000]
+ train/ActionL1Loss=0.0419
+ throughput/total_tokens=746,112,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3887/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=746,304,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3888/500000]
+ train/ActionL1Loss=0.0587
+ throughput/total_tokens=746,496,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3889/500000]
+ train/ActionL1Loss=0.0366
+ throughput/total_tokens=746,688,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3890/500000]
+ train/ActionL1Loss=0.0525
+ throughput/total_tokens=746,880,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3891/500000]
+ train/ActionL1Loss=0.0428
+ throughput/total_tokens=747,072,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3892/500000]
+ train/ActionL1Loss=0.0421
+ throughput/total_tokens=747,264,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3893/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=747,456,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3894/500000]
+ train/ActionL1Loss=0.0515
+ throughput/total_tokens=747,648,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3895/500000]
+ train/ActionL1Loss=0.0422
+ throughput/total_tokens=747,840,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3896/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=748,032,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3897/500000]
+ train/ActionL1Loss=0.0379
+ throughput/total_tokens=748,224,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3898/500000]
+ train/ActionL1Loss=0.0418
+ throughput/total_tokens=748,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3899/500000]
+ train/ActionL1Loss=0.0493
+ throughput/total_tokens=748,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3900/500000]
+ optim/total_grad_norm=9.013
+ train/ActionL1Loss=0.0478
+ throughput/total_tokens=748,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3901/500000]
+ train/ActionL1Loss=0.0530
+ throughput/total_tokens=748,992,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3902/500000]
+ train/ActionL1Loss=0.0357
+ throughput/total_tokens=749,184,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3903/500000]
+ train/ActionL1Loss=0.0368
+ throughput/total_tokens=749,376,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3904/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=749,568,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3905/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=749,760,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3906/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=749,952,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3907/500000]
+ train/ActionL1Loss=0.0378
+ throughput/total_tokens=750,144,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3908/500000]
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=750,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3909/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=750,528,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3910/500000]
+ train/ActionL1Loss=0.0428
+ throughput/total_tokens=750,720,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3911/500000]
+ train/ActionL1Loss=0.0448
+ throughput/total_tokens=750,912,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3912/500000]
+ train/ActionL1Loss=0.0455
+ throughput/total_tokens=751,104,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3913/500000]
+ train/ActionL1Loss=0.0412
+ throughput/total_tokens=751,296,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3914/500000]
+ train/ActionL1Loss=0.0424
+ throughput/total_tokens=751,488,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3915/500000]
+ train/ActionL1Loss=0.0495
+ throughput/total_tokens=751,680,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3916/500000]
+ train/ActionL1Loss=0.0494
+ throughput/total_tokens=751,872,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3917/500000]
+ train/ActionL1Loss=0.0540
+ throughput/total_tokens=752,064,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3918/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=752,256,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3919/500000]
+ train/ActionL1Loss=0.0384
+ throughput/total_tokens=752,448,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3920/500000]
+ optim/total_grad_norm=7.799
+ train/ActionL1Loss=0.0571
+ throughput/total_tokens=752,640,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3921/500000]
+ train/ActionL1Loss=0.0494
+ throughput/total_tokens=752,832,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3922/500000]
+ train/ActionL1Loss=0.0516
+ throughput/total_tokens=753,024,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3923/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=753,216,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3924/500000]
+ train/ActionL1Loss=0.0409
+ throughput/total_tokens=753,408,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3925/500000]
+ train/ActionL1Loss=0.0355
+ throughput/total_tokens=753,600,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3926/500000]
+ train/ActionL1Loss=0.0804
+ throughput/total_tokens=753,792,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3927/500000]
+ train/ActionL1Loss=0.0510
+ throughput/total_tokens=753,984,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3928/500000]
+ train/ActionL1Loss=0.0609
+ throughput/total_tokens=754,176,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3929/500000]
+ train/ActionL1Loss=0.0514
+ throughput/total_tokens=754,368,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3930/500000]
+ train/ActionL1Loss=0.0393
+ throughput/total_tokens=754,560,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3931/500000]
+ train/ActionL1Loss=0.0390
+ throughput/total_tokens=754,752,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3932/500000]
+ train/ActionL1Loss=0.1055
+ throughput/total_tokens=754,944,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3933/500000]
+ train/ActionL1Loss=0.0992
+ throughput/total_tokens=755,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3934/500000]
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=755,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3935/500000]
+ train/ActionL1Loss=0.0977
+ throughput/total_tokens=755,520,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3936/500000]
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=755,712,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3937/500000]
+ train/ActionL1Loss=0.1006
+ throughput/total_tokens=755,904,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3938/500000]
+ train/ActionL1Loss=0.0461
+ throughput/total_tokens=756,096,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3939/500000]
+ train/ActionL1Loss=0.0418
+ throughput/total_tokens=756,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3940/500000]
+ optim/total_grad_norm=8.094
+ train/ActionL1Loss=0.0889
+ throughput/total_tokens=756,480,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3941/500000]
+ train/ActionL1Loss=0.0544
+ throughput/total_tokens=756,672,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3942/500000]
+ train/ActionL1Loss=0.0601
+ throughput/total_tokens=756,864,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3943/500000]
+ train/ActionL1Loss=0.0578
+ throughput/total_tokens=757,056,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3944/500000]
+ train/ActionL1Loss=0.0512
+ throughput/total_tokens=757,248,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3945/500000]
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=757,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3946/500000]
+ train/ActionL1Loss=0.0581
+ throughput/total_tokens=757,632,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3947/500000]
+ train/ActionL1Loss=0.0470
+ throughput/total_tokens=757,824,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3948/500000]
+ train/ActionL1Loss=0.0529
+ throughput/total_tokens=758,016,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3949/500000]
+ train/ActionL1Loss=0.0494
+ throughput/total_tokens=758,208,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3950/500000]
+ train/ActionL1Loss=0.0566
+ throughput/total_tokens=758,400,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3951/500000]
+ train/ActionL1Loss=0.0593
+ throughput/total_tokens=758,592,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3952/500000]
+ train/ActionL1Loss=0.0487
+ throughput/total_tokens=758,784,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3953/500000]
+ train/ActionL1Loss=0.0610
+ throughput/total_tokens=758,976,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3954/500000]
+ train/ActionL1Loss=0.0689
+ throughput/total_tokens=759,168,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3955/500000]
+ train/ActionL1Loss=0.0569
+ throughput/total_tokens=759,360,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3956/500000]
+ train/ActionL1Loss=0.0509
+ throughput/total_tokens=759,552,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3957/500000]
+ train/ActionL1Loss=0.0513
+ throughput/total_tokens=759,744,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3958/500000]
+ train/ActionL1Loss=0.0445
+ throughput/total_tokens=759,936,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3959/500000]
+ train/ActionL1Loss=0.0511
+ throughput/total_tokens=760,128,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3960/500000]
+ optim/total_grad_norm=8.995
+ train/ActionL1Loss=0.0482
+ throughput/total_tokens=760,320,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=3961/500000]
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=760,512,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3962/500000]
+ train/ActionL1Loss=0.0471
+ throughput/total_tokens=760,704,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3963/500000]
+ train/ActionL1Loss=0.0469
+ throughput/total_tokens=760,896,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3964/500000]
+ train/ActionL1Loss=0.0555
+ throughput/total_tokens=761,088,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3965/500000]
+ train/ActionL1Loss=0.0462
+ throughput/total_tokens=761,280,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3966/500000]
+ train/ActionL1Loss=0.0418
+ throughput/total_tokens=761,472,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3967/500000]
+ train/ActionL1Loss=0.0648
+ throughput/total_tokens=761,664,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=3968/500000]
+ train/ActionL1Loss=0.0427
+ throughput/total_tokens=761,856,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3969/500000]
+ train/ActionL1Loss=0.0598
+ throughput/total_tokens=762,048,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=3970/500000]
+ train/ActionL1Loss=0.0385
+ throughput/total_tokens=762,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3971/500000]
+ train/ActionL1Loss=0.0417
+ throughput/total_tokens=762,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3972/500000]
+ train/ActionL1Loss=0.0424
+ throughput/total_tokens=762,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3973/500000]
+ train/ActionL1Loss=0.0523
+ throughput/total_tokens=762,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3974/500000]
+ train/ActionL1Loss=0.0449
+ throughput/total_tokens=763,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3975/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=763,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3976/500000]
+ train/ActionL1Loss=0.0450
+ throughput/total_tokens=763,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3977/500000]
+ train/ActionL1Loss=0.0448
+ throughput/total_tokens=763,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3978/500000]
+ train/ActionL1Loss=0.0624
+ throughput/total_tokens=763,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3979/500000]
+ train/ActionL1Loss=0.0425
+ throughput/total_tokens=763,968,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=3980/500000]
+ optim/total_grad_norm=7.344
+ train/ActionL1Loss=0.0444
+ throughput/total_tokens=764,160,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=3981/500000]
+ train/ActionL1Loss=0.0506
+ throughput/total_tokens=764,352,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3982/500000]
+ train/ActionL1Loss=0.0465
+ throughput/total_tokens=764,544,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3983/500000]
+ train/ActionL1Loss=0.0424
+ throughput/total_tokens=764,736,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3984/500000]
+ train/ActionL1Loss=0.0448
+ throughput/total_tokens=764,928,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3985/500000]
+ train/ActionL1Loss=0.0467
+ throughput/total_tokens=765,120,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3986/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=765,312,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3987/500000]
+ train/ActionL1Loss=0.0417
+ throughput/total_tokens=765,504,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3988/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=765,696,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3989/500000]
+ train/ActionL1Loss=0.0564
+ throughput/total_tokens=765,888,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3990/500000]
+ train/ActionL1Loss=0.0435
+ throughput/total_tokens=766,080,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=3991/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=766,272,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3992/500000]
+ train/ActionL1Loss=0.0444
+ throughput/total_tokens=766,464,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3993/500000]
+ train/ActionL1Loss=0.0537
+ throughput/total_tokens=766,656,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3994/500000]
+ train/ActionL1Loss=0.0458
+ throughput/total_tokens=766,848,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=3995/500000]
+ train/ActionL1Loss=0.0422
+ throughput/total_tokens=767,040,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3996/500000]
+ train/ActionL1Loss=0.0469
+ throughput/total_tokens=767,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3997/500000]
+ train/ActionL1Loss=0.0383
+ throughput/total_tokens=767,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3998/500000]
+ train/ActionL1Loss=0.0591
+ throughput/total_tokens=767,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=3999/500000]
+ train/ActionL1Loss=0.0395
+ throughput/total_tokens=767,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4000/500000]
+ optim/total_grad_norm=8.327
+ train/ActionL1Loss=0.0488
+ throughput/total_tokens=768,000,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+10/03 [15:43:59] INFO | >> Saving config... checkpoint.py:608
+10/03 [15:45:01] INFO | >> Saving model state... checkpoint.py:796
+10/03 [15:46:12] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [15:47:41] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=4001/500000]
+ train/ActionL1Loss=0.0460
+ throughput/total_tokens=768,192,000
+ throughput/device/tokens_per_second=1,223
+ throughput/device/batches_per_second=0.0510
+[step=4002/500000]
+ train/ActionL1Loss=0.0675
+ throughput/total_tokens=768,384,000
+ throughput/device/tokens_per_second=1,201
+ throughput/device/batches_per_second=0.0501
+[step=4003/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=768,576,000
+ throughput/device/tokens_per_second=1,194
+ throughput/device/batches_per_second=0.0498
+[step=4004/500000]
+ train/ActionL1Loss=0.0466
+ throughput/total_tokens=768,768,000
+ throughput/device/tokens_per_second=1,190
+ throughput/device/batches_per_second=0.0496
+[step=4005/500000]
+ train/ActionL1Loss=0.0504
+ throughput/total_tokens=768,960,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4006/500000]
+ train/ActionL1Loss=0.0665
+ throughput/total_tokens=769,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4007/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=769,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4008/500000]
+ train/ActionL1Loss=0.0371
+ throughput/total_tokens=769,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4009/500000]
+ train/ActionL1Loss=0.0385
+ throughput/total_tokens=769,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4010/500000]
+ train/ActionL1Loss=0.0597
+ throughput/total_tokens=769,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4011/500000]
+ train/ActionL1Loss=0.0442
+ throughput/total_tokens=770,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4012/500000]
+ train/ActionL1Loss=0.0503
+ throughput/total_tokens=770,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4013/500000]
+ train/ActionL1Loss=0.0461
+ throughput/total_tokens=770,496,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4014/500000]
+ train/ActionL1Loss=0.0386
+ throughput/total_tokens=770,688,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4015/500000]
+ train/ActionL1Loss=0.0379
+ throughput/total_tokens=770,880,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4016/500000]
+ train/ActionL1Loss=0.0486
+ throughput/total_tokens=771,072,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4017/500000]
+ train/ActionL1Loss=0.0432
+ throughput/total_tokens=771,264,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4018/500000]
+ train/ActionL1Loss=0.0384
+ throughput/total_tokens=771,456,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4019/500000]
+ train/ActionL1Loss=0.0400
+ throughput/total_tokens=771,648,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4020/500000]
+ optim/total_grad_norm=8.060
+ train/ActionL1Loss=0.0399
+ throughput/total_tokens=771,840,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4021/500000]
+ train/ActionL1Loss=0.0530
+ throughput/total_tokens=772,032,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4022/500000]
+ train/ActionL1Loss=0.0440
+ throughput/total_tokens=772,224,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4023/500000]
+ train/ActionL1Loss=0.0462
+ throughput/total_tokens=772,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4024/500000]
+ train/ActionL1Loss=0.0503
+ throughput/total_tokens=772,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4025/500000]
+ train/ActionL1Loss=0.0536
+ throughput/total_tokens=772,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4026/500000]
+ train/ActionL1Loss=0.0377
+ throughput/total_tokens=772,992,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4027/500000]
+ train/ActionL1Loss=0.0514
+ throughput/total_tokens=773,184,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4028/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=773,376,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4029/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=773,568,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4030/500000]
+ train/ActionL1Loss=0.0497
+ throughput/total_tokens=773,760,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4031/500000]
+ train/ActionL1Loss=0.0423
+ throughput/total_tokens=773,952,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4032/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=774,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4033/500000]
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=774,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4034/500000]
+ train/ActionL1Loss=0.0384
+ throughput/total_tokens=774,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4035/500000]
+ train/ActionL1Loss=0.0501
+ throughput/total_tokens=774,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4036/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=774,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4037/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=775,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4038/500000]
+ train/ActionL1Loss=0.0440
+ throughput/total_tokens=775,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4039/500000]
+ train/ActionL1Loss=0.0487
+ throughput/total_tokens=775,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4040/500000]
+ optim/total_grad_norm=8.250
+ train/ActionL1Loss=0.0508
+ throughput/total_tokens=775,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4041/500000]
+ train/ActionL1Loss=0.0392
+ throughput/total_tokens=775,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4042/500000]
+ train/ActionL1Loss=0.0426
+ throughput/total_tokens=776,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4043/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=776,256,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4044/500000]
+ train/ActionL1Loss=0.0429
+ throughput/total_tokens=776,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4045/500000]
+ train/ActionL1Loss=0.0386
+ throughput/total_tokens=776,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4046/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=776,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4047/500000]
+ train/ActionL1Loss=0.0481
+ throughput/total_tokens=777,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4048/500000]
+ train/ActionL1Loss=0.0370
+ throughput/total_tokens=777,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4049/500000]
+ train/ActionL1Loss=0.0381
+ throughput/total_tokens=777,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4050/500000]
+ train/ActionL1Loss=0.0465
+ throughput/total_tokens=777,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4051/500000]
+ train/ActionL1Loss=0.0536
+ throughput/total_tokens=777,792,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4052/500000]
+ train/ActionL1Loss=0.0434
+ throughput/total_tokens=777,984,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4053/500000]
+ train/ActionL1Loss=0.0533
+ throughput/total_tokens=778,176,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4054/500000]
+ train/ActionL1Loss=0.0555
+ throughput/total_tokens=778,368,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4055/500000]
+ train/ActionL1Loss=0.0423
+ throughput/total_tokens=778,560,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4056/500000]
+ train/ActionL1Loss=0.0388
+ throughput/total_tokens=778,752,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4057/500000]
+ train/ActionL1Loss=0.0394
+ throughput/total_tokens=778,944,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4058/500000]
+ train/ActionL1Loss=0.0409
+ throughput/total_tokens=779,136,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4059/500000]
+ train/ActionL1Loss=0.0467
+ throughput/total_tokens=779,328,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4060/500000]
+ optim/total_grad_norm=6.219
+ train/ActionL1Loss=0.0516
+ throughput/total_tokens=779,520,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=4061/500000]
+ train/ActionL1Loss=0.0450
+ throughput/total_tokens=779,712,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4062/500000]
+ train/ActionL1Loss=0.0472
+ throughput/total_tokens=779,904,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4063/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=780,096,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4064/500000]
+ train/ActionL1Loss=0.0451
+ throughput/total_tokens=780,288,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4065/500000]
+ train/ActionL1Loss=0.0461
+ throughput/total_tokens=780,480,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4066/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=780,672,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4067/500000]
+ train/ActionL1Loss=0.0557
+ throughput/total_tokens=780,864,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4068/500000]
+ train/ActionL1Loss=0.0446
+ throughput/total_tokens=781,056,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4069/500000]
+ train/ActionL1Loss=0.0411
+ throughput/total_tokens=781,248,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4070/500000]
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=781,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4071/500000]
+ train/ActionL1Loss=0.0400
+ throughput/total_tokens=781,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4072/500000]
+ train/ActionL1Loss=0.0527
+ throughput/total_tokens=781,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4073/500000]
+ train/ActionL1Loss=0.0507
+ throughput/total_tokens=782,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4074/500000]
+ train/ActionL1Loss=0.0366
+ throughput/total_tokens=782,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4075/500000]
+ train/ActionL1Loss=0.0416
+ throughput/total_tokens=782,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4076/500000]
+ train/ActionL1Loss=0.0457
+ throughput/total_tokens=782,592,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4077/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=782,784,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4078/500000]
+ train/ActionL1Loss=0.0467
+ throughput/total_tokens=782,976,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4079/500000]
+ train/ActionL1Loss=0.0396
+ throughput/total_tokens=783,168,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4080/500000]
+ optim/total_grad_norm=7.735
+ train/ActionL1Loss=0.0428
+ throughput/total_tokens=783,360,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4081/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=783,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4082/500000]
+ train/ActionL1Loss=0.0443
+ throughput/total_tokens=783,744,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4083/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=783,936,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4084/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=784,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4085/500000]
+ train/ActionL1Loss=0.0476
+ throughput/total_tokens=784,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4086/500000]
+ train/ActionL1Loss=0.0414
+ throughput/total_tokens=784,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4087/500000]
+ train/ActionL1Loss=0.0472
+ throughput/total_tokens=784,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4088/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=784,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4089/500000]
+ train/ActionL1Loss=0.0445
+ throughput/total_tokens=785,088,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4090/500000]
+ train/ActionL1Loss=0.0458
+ throughput/total_tokens=785,280,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4091/500000]
+ train/ActionL1Loss=0.0546
+ throughput/total_tokens=785,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4092/500000]
+ train/ActionL1Loss=0.0361
+ throughput/total_tokens=785,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4093/500000]
+ train/ActionL1Loss=0.0405
+ throughput/total_tokens=785,856,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4094/500000]
+ train/ActionL1Loss=0.0455
+ throughput/total_tokens=786,048,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4095/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=786,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4096/500000]
+ train/ActionL1Loss=0.0468
+ throughput/total_tokens=786,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4097/500000]
+ train/ActionL1Loss=0.0418
+ throughput/total_tokens=786,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4098/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=786,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4099/500000]
+ train/ActionL1Loss=0.0386
+ throughput/total_tokens=787,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4100/500000]
+ optim/total_grad_norm=9.569
+ train/ActionL1Loss=0.0406
+ throughput/total_tokens=787,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4101/500000]
+ train/ActionL1Loss=0.0557
+ throughput/total_tokens=787,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4102/500000]
+ train/ActionL1Loss=0.0451
+ throughput/total_tokens=787,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4103/500000]
+ train/ActionL1Loss=0.0460
+ throughput/total_tokens=787,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4104/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=787,968,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4105/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=788,160,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4106/500000]
+ train/ActionL1Loss=0.0449
+ throughput/total_tokens=788,352,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4107/500000]
+ train/ActionL1Loss=0.0409
+ throughput/total_tokens=788,544,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4108/500000]
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=788,736,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4109/500000]
+ train/ActionL1Loss=0.0396
+ throughput/total_tokens=788,928,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4110/500000]
+ train/ActionL1Loss=0.0371
+ throughput/total_tokens=789,120,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4111/500000]
+ train/ActionL1Loss=0.0419
+ throughput/total_tokens=789,312,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4112/500000]
+ train/ActionL1Loss=0.0508
+ throughput/total_tokens=789,504,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4113/500000]
+ train/ActionL1Loss=0.0488
+ throughput/total_tokens=789,696,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4114/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=789,888,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4115/500000]
+ train/ActionL1Loss=0.0383
+ throughput/total_tokens=790,080,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4116/500000]
+ train/ActionL1Loss=0.0468
+ throughput/total_tokens=790,272,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4117/500000]
+ train/ActionL1Loss=0.0431
+ throughput/total_tokens=790,464,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4118/500000]
+ train/ActionL1Loss=0.0374
+ throughput/total_tokens=790,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4119/500000]
+ train/ActionL1Loss=0.0443
+ throughput/total_tokens=790,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4120/500000]
+ optim/total_grad_norm=8.549
+ train/ActionL1Loss=0.0475
+ throughput/total_tokens=791,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4121/500000]
+ train/ActionL1Loss=0.0436
+ throughput/total_tokens=791,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4122/500000]
+ train/ActionL1Loss=0.0427
+ throughput/total_tokens=791,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4123/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=791,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4124/500000]
+ train/ActionL1Loss=0.0425
+ throughput/total_tokens=791,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4125/500000]
+ train/ActionL1Loss=0.0422
+ throughput/total_tokens=792,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4126/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=792,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4127/500000]
+ train/ActionL1Loss=0.0409
+ throughput/total_tokens=792,384,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4128/500000]
+ train/ActionL1Loss=0.0383
+ throughput/total_tokens=792,576,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4129/500000]
+ train/ActionL1Loss=0.0426
+ throughput/total_tokens=792,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4130/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=792,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4131/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=793,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4132/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=793,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4133/500000]
+ train/ActionL1Loss=0.0381
+ throughput/total_tokens=793,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4134/500000]
+ train/ActionL1Loss=0.0388
+ throughput/total_tokens=793,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4135/500000]
+ train/ActionL1Loss=0.0376
+ throughput/total_tokens=793,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4136/500000]
+ train/ActionL1Loss=0.0388
+ throughput/total_tokens=794,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4137/500000]
+ train/ActionL1Loss=0.0419
+ throughput/total_tokens=794,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4138/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=794,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4139/500000]
+ train/ActionL1Loss=0.0435
+ throughput/total_tokens=794,688,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4140/500000]
+ optim/total_grad_norm=6.566
+ train/ActionL1Loss=0.0432
+ throughput/total_tokens=794,880,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4141/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=795,072,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4142/500000]
+ train/ActionL1Loss=0.0435
+ throughput/total_tokens=795,264,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4143/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=795,456,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4144/500000]
+ train/ActionL1Loss=0.0359
+ throughput/total_tokens=795,648,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4145/500000]
+ train/ActionL1Loss=0.0453
+ throughput/total_tokens=795,840,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4146/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=796,032,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4147/500000]
+ train/ActionL1Loss=0.0432
+ throughput/total_tokens=796,224,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4148/500000]
+ train/ActionL1Loss=0.0457
+ throughput/total_tokens=796,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4149/500000]
+ train/ActionL1Loss=0.0358
+ throughput/total_tokens=796,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4150/500000]
+ train/ActionL1Loss=0.0442
+ throughput/total_tokens=796,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4151/500000]
+ train/ActionL1Loss=0.0377
+ throughput/total_tokens=796,992,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4152/500000]
+ train/ActionL1Loss=0.0377
+ throughput/total_tokens=797,184,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4153/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=797,376,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4154/500000]
+ train/ActionL1Loss=0.0434
+ throughput/total_tokens=797,568,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4155/500000]
+ train/ActionL1Loss=0.0362
+ throughput/total_tokens=797,760,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4156/500000]
+ train/ActionL1Loss=0.0469
+ throughput/total_tokens=797,952,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4157/500000]
+ train/ActionL1Loss=0.0421
+ throughput/total_tokens=798,144,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4158/500000]
+ train/ActionL1Loss=0.0421
+ throughput/total_tokens=798,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4159/500000]
+ train/ActionL1Loss=0.0459
+ throughput/total_tokens=798,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4160/500000]
+ optim/total_grad_norm=8.089
+ train/ActionL1Loss=0.0426
+ throughput/total_tokens=798,720,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4161/500000]
+ train/ActionL1Loss=0.0445
+ throughput/total_tokens=798,912,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4162/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=799,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4163/500000]
+ train/ActionL1Loss=0.0387
+ throughput/total_tokens=799,296,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4164/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=799,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4165/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=799,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4166/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=799,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4167/500000]
+ train/ActionL1Loss=0.0443
+ throughput/total_tokens=800,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4168/500000]
+ train/ActionL1Loss=0.0454
+ throughput/total_tokens=800,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4169/500000]
+ train/ActionL1Loss=0.0530
+ throughput/total_tokens=800,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4170/500000]
+ train/ActionL1Loss=0.0366
+ throughput/total_tokens=800,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4171/500000]
+ train/ActionL1Loss=0.0448
+ throughput/total_tokens=800,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4172/500000]
+ train/ActionL1Loss=0.0394
+ throughput/total_tokens=801,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4173/500000]
+ train/ActionL1Loss=0.0452
+ throughput/total_tokens=801,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4174/500000]
+ train/ActionL1Loss=0.0354
+ throughput/total_tokens=801,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4175/500000]
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=801,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4176/500000]
+ train/ActionL1Loss=0.0497
+ throughput/total_tokens=801,792,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4177/500000]
+ train/ActionL1Loss=0.0390
+ throughput/total_tokens=801,984,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4178/500000]
+ train/ActionL1Loss=0.0457
+ throughput/total_tokens=802,176,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4179/500000]
+ train/ActionL1Loss=0.0474
+ throughput/total_tokens=802,368,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4180/500000]
+ optim/total_grad_norm=7.487
+ train/ActionL1Loss=0.0388
+ throughput/total_tokens=802,560,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4181/500000]
+ train/ActionL1Loss=0.0402
+ throughput/total_tokens=802,752,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4182/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=802,944,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4183/500000]
+ train/ActionL1Loss=0.0419
+ throughput/total_tokens=803,136,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4184/500000]
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=803,328,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4185/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=803,520,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4186/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=803,712,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4187/500000]
+ train/ActionL1Loss=0.0438
+ throughput/total_tokens=803,904,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4188/500000]
+ train/ActionL1Loss=0.0493
+ throughput/total_tokens=804,096,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4189/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=804,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4190/500000]
+ train/ActionL1Loss=0.0424
+ throughput/total_tokens=804,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4191/500000]
+ train/ActionL1Loss=0.0467
+ throughput/total_tokens=804,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4192/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=804,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4193/500000]
+ train/ActionL1Loss=0.0443
+ throughput/total_tokens=805,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4194/500000]
+ train/ActionL1Loss=0.0522
+ throughput/total_tokens=805,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4195/500000]
+ train/ActionL1Loss=0.0446
+ throughput/total_tokens=805,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4196/500000]
+ train/ActionL1Loss=0.0519
+ throughput/total_tokens=805,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4197/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=805,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4198/500000]
+ train/ActionL1Loss=0.0392
+ throughput/total_tokens=806,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4199/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=806,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4200/500000]
+ optim/total_grad_norm=7.135
+ train/ActionL1Loss=0.0398
+ throughput/total_tokens=806,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4201/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=806,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4202/500000]
+ train/ActionL1Loss=0.0533
+ throughput/total_tokens=806,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4203/500000]
+ train/ActionL1Loss=0.0440
+ throughput/total_tokens=806,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4204/500000]
+ train/ActionL1Loss=0.0401
+ throughput/total_tokens=807,168,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4205/500000]
+ train/ActionL1Loss=0.0459
+ throughput/total_tokens=807,360,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4206/500000]
+ train/ActionL1Loss=0.0450
+ throughput/total_tokens=807,552,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4207/500000]
+ train/ActionL1Loss=0.0448
+ throughput/total_tokens=807,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4208/500000]
+ train/ActionL1Loss=0.0439
+ throughput/total_tokens=807,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4209/500000]
+ train/ActionL1Loss=0.0404
+ throughput/total_tokens=808,128,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4210/500000]
+ train/ActionL1Loss=0.0473
+ throughput/total_tokens=808,320,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4211/500000]
+ train/ActionL1Loss=0.0372
+ throughput/total_tokens=808,512,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4212/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=808,704,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4213/500000]
+ train/ActionL1Loss=0.0456
+ throughput/total_tokens=808,896,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4214/500000]
+ train/ActionL1Loss=0.0452
+ throughput/total_tokens=809,088,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4215/500000]
+ train/ActionL1Loss=0.0492
+ throughput/total_tokens=809,280,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4216/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=809,472,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4217/500000]
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=809,664,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4218/500000]
+ train/ActionL1Loss=0.0471
+ throughput/total_tokens=809,856,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4219/500000]
+ train/ActionL1Loss=0.0424
+ throughput/total_tokens=810,048,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4220/500000]
+ optim/total_grad_norm=7.853
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=810,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4221/500000]
+ train/ActionL1Loss=0.0411
+ throughput/total_tokens=810,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4222/500000]
+ train/ActionL1Loss=0.0414
+ throughput/total_tokens=810,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4223/500000]
+ train/ActionL1Loss=0.0405
+ throughput/total_tokens=810,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4224/500000]
+ train/ActionL1Loss=0.0436
+ throughput/total_tokens=811,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4225/500000]
+ train/ActionL1Loss=0.0491
+ throughput/total_tokens=811,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4226/500000]
+ train/ActionL1Loss=0.0433
+ throughput/total_tokens=811,392,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4227/500000]
+ train/ActionL1Loss=0.0460
+ throughput/total_tokens=811,584,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4228/500000]
+ train/ActionL1Loss=0.0406
+ throughput/total_tokens=811,776,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4229/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=811,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4230/500000]
+ train/ActionL1Loss=0.0355
+ throughput/total_tokens=812,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4231/500000]
+ train/ActionL1Loss=0.0439
+ throughput/total_tokens=812,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4232/500000]
+ train/ActionL1Loss=0.0359
+ throughput/total_tokens=812,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4233/500000]
+ train/ActionL1Loss=0.0558
+ throughput/total_tokens=812,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4234/500000]
+ train/ActionL1Loss=0.0446
+ throughput/total_tokens=812,928,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4235/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=813,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4236/500000]
+ train/ActionL1Loss=0.0464
+ throughput/total_tokens=813,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4237/500000]
+ train/ActionL1Loss=0.0433
+ throughput/total_tokens=813,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4238/500000]
+ train/ActionL1Loss=0.0538
+ throughput/total_tokens=813,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4239/500000]
+ train/ActionL1Loss=0.0374
+ throughput/total_tokens=813,888,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4240/500000]
+ optim/total_grad_norm=8.060
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=814,080,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4241/500000]
+ train/ActionL1Loss=0.0456
+ throughput/total_tokens=814,272,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4242/500000]
+ train/ActionL1Loss=0.0654
+ throughput/total_tokens=814,464,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4243/500000]
+ train/ActionL1Loss=0.0570
+ throughput/total_tokens=814,656,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4244/500000]
+ train/ActionL1Loss=0.0427
+ throughput/total_tokens=814,848,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4245/500000]
+ train/ActionL1Loss=0.0508
+ throughput/total_tokens=815,040,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4246/500000]
+ train/ActionL1Loss=0.0393
+ throughput/total_tokens=815,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4247/500000]
+ train/ActionL1Loss=0.0561
+ throughput/total_tokens=815,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4248/500000]
+ train/ActionL1Loss=0.0424
+ throughput/total_tokens=815,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4249/500000]
+ train/ActionL1Loss=0.0386
+ throughput/total_tokens=815,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4250/500000]
+ train/ActionL1Loss=0.0357
+ throughput/total_tokens=816,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4251/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=816,192,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4252/500000]
+ train/ActionL1Loss=0.0475
+ throughput/total_tokens=816,384,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4253/500000]
+ train/ActionL1Loss=0.0558
+ throughput/total_tokens=816,576,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4254/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=816,768,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4255/500000]
+ train/ActionL1Loss=0.0442
+ throughput/total_tokens=816,960,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4256/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=817,152,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4257/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=817,344,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4258/500000]
+ train/ActionL1Loss=0.0416
+ throughput/total_tokens=817,536,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4259/500000]
+ train/ActionL1Loss=0.0420
+ throughput/total_tokens=817,728,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4260/500000]
+ optim/total_grad_norm=9.996
+ train/ActionL1Loss=0.0457
+ throughput/total_tokens=817,920,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=4261/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=818,112,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4262/500000]
+ train/ActionL1Loss=0.0362
+ throughput/total_tokens=818,304,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4263/500000]
+ train/ActionL1Loss=0.0376
+ throughput/total_tokens=818,496,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4264/500000]
+ train/ActionL1Loss=0.0470
+ throughput/total_tokens=818,688,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4265/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=818,880,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4266/500000]
+ train/ActionL1Loss=0.0390
+ throughput/total_tokens=819,072,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4267/500000]
+ train/ActionL1Loss=0.0370
+ throughput/total_tokens=819,264,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4268/500000]
+ train/ActionL1Loss=0.0461
+ throughput/total_tokens=819,456,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4269/500000]
+ train/ActionL1Loss=0.0325
+ throughput/total_tokens=819,648,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4270/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=819,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4271/500000]
+ train/ActionL1Loss=0.0332
+ throughput/total_tokens=820,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4272/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=820,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4273/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=820,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4274/500000]
+ train/ActionL1Loss=0.0392
+ throughput/total_tokens=820,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4275/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=820,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4276/500000]
+ train/ActionL1Loss=0.0426
+ throughput/total_tokens=820,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4277/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=821,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4278/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=821,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4279/500000]
+ train/ActionL1Loss=0.0325
+ throughput/total_tokens=821,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4280/500000]
+ optim/total_grad_norm=10.76
+ train/ActionL1Loss=0.0454
+ throughput/total_tokens=821,760,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4281/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=821,952,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4282/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=822,144,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4283/500000]
+ train/ActionL1Loss=0.0591
+ throughput/total_tokens=822,336,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4284/500000]
+ train/ActionL1Loss=0.0572
+ throughput/total_tokens=822,528,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4285/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=822,720,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4286/500000]
+ train/ActionL1Loss=0.0492
+ throughput/total_tokens=822,912,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4287/500000]
+ train/ActionL1Loss=0.0430
+ throughput/total_tokens=823,104,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4288/500000]
+ train/ActionL1Loss=0.0332
+ throughput/total_tokens=823,296,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4289/500000]
+ train/ActionL1Loss=0.0384
+ throughput/total_tokens=823,488,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4290/500000]
+ train/ActionL1Loss=0.0410
+ throughput/total_tokens=823,680,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4291/500000]
+ train/ActionL1Loss=0.0475
+ throughput/total_tokens=823,872,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4292/500000]
+ train/ActionL1Loss=0.0429
+ throughput/total_tokens=824,064,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4293/500000]
+ train/ActionL1Loss=0.0417
+ throughput/total_tokens=824,256,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4294/500000]
+ train/ActionL1Loss=0.0404
+ throughput/total_tokens=824,448,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4295/500000]
+ train/ActionL1Loss=0.0427
+ throughput/total_tokens=824,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4296/500000]
+ train/ActionL1Loss=0.0356
+ throughput/total_tokens=824,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4297/500000]
+ train/ActionL1Loss=0.0543
+ throughput/total_tokens=825,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4298/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=825,216,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4299/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=825,408,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4300/500000]
+ optim/total_grad_norm=6.653
+ train/ActionL1Loss=0.0443
+ throughput/total_tokens=825,600,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4301/500000]
+ train/ActionL1Loss=0.0529
+ throughput/total_tokens=825,792,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4302/500000]
+ train/ActionL1Loss=0.0552
+ throughput/total_tokens=825,984,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4303/500000]
+ train/ActionL1Loss=0.0483
+ throughput/total_tokens=826,176,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4304/500000]
+ train/ActionL1Loss=0.0461
+ throughput/total_tokens=826,368,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4305/500000]
+ train/ActionL1Loss=0.0379
+ throughput/total_tokens=826,560,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4306/500000]
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=826,752,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4307/500000]
+ train/ActionL1Loss=0.0484
+ throughput/total_tokens=826,944,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4308/500000]
+ train/ActionL1Loss=0.0374
+ throughput/total_tokens=827,136,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4309/500000]
+ train/ActionL1Loss=0.0510
+ throughput/total_tokens=827,328,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4310/500000]
+ train/ActionL1Loss=0.0445
+ throughput/total_tokens=827,520,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4311/500000]
+ train/ActionL1Loss=0.0451
+ throughput/total_tokens=827,712,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4312/500000]
+ train/ActionL1Loss=0.0446
+ throughput/total_tokens=827,904,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4313/500000]
+ train/ActionL1Loss=0.0429
+ throughput/total_tokens=828,096,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4314/500000]
+ train/ActionL1Loss=0.0381
+ throughput/total_tokens=828,288,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4315/500000]
+ train/ActionL1Loss=0.0383
+ throughput/total_tokens=828,480,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4316/500000]
+ train/ActionL1Loss=0.0505
+ throughput/total_tokens=828,672,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4317/500000]
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=828,864,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4318/500000]
+ train/ActionL1Loss=0.0366
+ throughput/total_tokens=829,056,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4319/500000]
+ train/ActionL1Loss=0.0489
+ throughput/total_tokens=829,248,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4320/500000]
+ optim/total_grad_norm=7.454
+ train/ActionL1Loss=0.0490
+ throughput/total_tokens=829,440,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4321/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=829,632,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4322/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=829,824,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4323/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=830,016,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4324/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=830,208,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4325/500000]
+ train/ActionL1Loss=0.0442
+ throughput/total_tokens=830,400,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4326/500000]
+ train/ActionL1Loss=0.0347
+ throughput/total_tokens=830,592,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4327/500000]
+ train/ActionL1Loss=0.0405
+ throughput/total_tokens=830,784,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4328/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=830,976,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4329/500000]
+ train/ActionL1Loss=0.0409
+ throughput/total_tokens=831,168,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4330/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=831,360,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4331/500000]
+ train/ActionL1Loss=0.0446
+ throughput/total_tokens=831,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4332/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=831,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4333/500000]
+ train/ActionL1Loss=0.0383
+ throughput/total_tokens=831,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4334/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=832,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4335/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=832,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4336/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=832,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4337/500000]
+ train/ActionL1Loss=0.0355
+ throughput/total_tokens=832,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4338/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=832,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4339/500000]
+ train/ActionL1Loss=0.0459
+ throughput/total_tokens=833,088,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4340/500000]
+ optim/total_grad_norm=8.577
+ train/ActionL1Loss=0.0435
+ throughput/total_tokens=833,280,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4341/500000]
+ train/ActionL1Loss=0.0371
+ throughput/total_tokens=833,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4342/500000]
+ train/ActionL1Loss=0.0394
+ throughput/total_tokens=833,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4343/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=833,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4344/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=834,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4345/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=834,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4346/500000]
+ train/ActionL1Loss=0.0361
+ throughput/total_tokens=834,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4347/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=834,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4348/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=834,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4349/500000]
+ train/ActionL1Loss=0.0490
+ throughput/total_tokens=835,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4350/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=835,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4351/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=835,392,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4352/500000]
+ train/ActionL1Loss=0.0362
+ throughput/total_tokens=835,584,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4353/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=835,776,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4354/500000]
+ train/ActionL1Loss=0.0423
+ throughput/total_tokens=835,968,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4355/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=836,160,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4356/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=836,352,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4357/500000]
+ train/ActionL1Loss=0.0407
+ throughput/total_tokens=836,544,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4358/500000]
+ train/ActionL1Loss=0.0445
+ throughput/total_tokens=836,736,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4359/500000]
+ train/ActionL1Loss=0.0393
+ throughput/total_tokens=836,928,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4360/500000]
+ optim/total_grad_norm=9.585
+ train/ActionL1Loss=0.0363
+ throughput/total_tokens=837,120,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=4361/500000]
+ train/ActionL1Loss=0.0442
+ throughput/total_tokens=837,312,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4362/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=837,504,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4363/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=837,696,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4364/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=837,888,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4365/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=838,080,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4366/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=838,272,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4367/500000]
+ train/ActionL1Loss=0.0434
+ throughput/total_tokens=838,464,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4368/500000]
+ train/ActionL1Loss=0.0355
+ throughput/total_tokens=838,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4369/500000]
+ train/ActionL1Loss=0.0534
+ throughput/total_tokens=838,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4370/500000]
+ train/ActionL1Loss=0.0399
+ throughput/total_tokens=839,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4371/500000]
+ train/ActionL1Loss=0.0566
+ throughput/total_tokens=839,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4372/500000]
+ train/ActionL1Loss=0.0530
+ throughput/total_tokens=839,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4373/500000]
+ train/ActionL1Loss=0.0528
+ throughput/total_tokens=839,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4374/500000]
+ train/ActionL1Loss=0.0431
+ throughput/total_tokens=839,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4375/500000]
+ train/ActionL1Loss=0.0429
+ throughput/total_tokens=840,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4376/500000]
+ train/ActionL1Loss=0.0557
+ throughput/total_tokens=840,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4377/500000]
+ train/ActionL1Loss=0.0436
+ throughput/total_tokens=840,384,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4378/500000]
+ train/ActionL1Loss=0.0430
+ throughput/total_tokens=840,576,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4379/500000]
+ train/ActionL1Loss=0.0455
+ throughput/total_tokens=840,768,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4380/500000]
+ optim/total_grad_norm=7.269
+ train/ActionL1Loss=0.0418
+ throughput/total_tokens=840,960,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4381/500000]
+ train/ActionL1Loss=0.0463
+ throughput/total_tokens=841,152,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4382/500000]
+ train/ActionL1Loss=0.0372
+ throughput/total_tokens=841,344,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4383/500000]
+ train/ActionL1Loss=0.0424
+ throughput/total_tokens=841,536,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4384/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=841,728,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4385/500000]
+ train/ActionL1Loss=0.0435
+ throughput/total_tokens=841,920,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4386/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=842,112,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4387/500000]
+ train/ActionL1Loss=0.0404
+ throughput/total_tokens=842,304,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4388/500000]
+ train/ActionL1Loss=0.0442
+ throughput/total_tokens=842,496,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4389/500000]
+ train/ActionL1Loss=0.0356
+ throughput/total_tokens=842,688,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4390/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=842,880,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4391/500000]
+ train/ActionL1Loss=0.0337
+ throughput/total_tokens=843,072,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4392/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=843,264,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4393/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=843,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4394/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=843,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4395/500000]
+ train/ActionL1Loss=0.0398
+ throughput/total_tokens=843,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4396/500000]
+ train/ActionL1Loss=0.0357
+ throughput/total_tokens=844,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4397/500000]
+ train/ActionL1Loss=0.0469
+ throughput/total_tokens=844,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4398/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=844,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4399/500000]
+ train/ActionL1Loss=0.0421
+ throughput/total_tokens=844,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4400/500000]
+ optim/total_grad_norm=6.987
+ train/ActionL1Loss=0.0426
+ throughput/total_tokens=844,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4401/500000]
+ train/ActionL1Loss=0.0414
+ throughput/total_tokens=844,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4402/500000]
+ train/ActionL1Loss=0.0428
+ throughput/total_tokens=845,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4403/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=845,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4404/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=845,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4405/500000]
+ train/ActionL1Loss=0.0422
+ throughput/total_tokens=845,760,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4406/500000]
+ train/ActionL1Loss=0.0484
+ throughput/total_tokens=845,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4407/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=846,144,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4408/500000]
+ train/ActionL1Loss=0.0431
+ throughput/total_tokens=846,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4409/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=846,528,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4410/500000]
+ train/ActionL1Loss=0.0459
+ throughput/total_tokens=846,720,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=4411/500000]
+ train/ActionL1Loss=0.0384
+ throughput/total_tokens=846,912,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4412/500000]
+ train/ActionL1Loss=0.0489
+ throughput/total_tokens=847,104,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4413/500000]
+ train/ActionL1Loss=0.0462
+ throughput/total_tokens=847,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4414/500000]
+ train/ActionL1Loss=0.0474
+ throughput/total_tokens=847,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4415/500000]
+ train/ActionL1Loss=0.0455
+ throughput/total_tokens=847,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4416/500000]
+ train/ActionL1Loss=0.0477
+ throughput/total_tokens=847,872,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4417/500000]
+ train/ActionL1Loss=0.0436
+ throughput/total_tokens=848,064,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4418/500000]
+ train/ActionL1Loss=0.0393
+ throughput/total_tokens=848,256,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4419/500000]
+ train/ActionL1Loss=0.0488
+ throughput/total_tokens=848,448,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4420/500000]
+ optim/total_grad_norm=8.323
+ train/ActionL1Loss=0.0479
+ throughput/total_tokens=848,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4421/500000]
+ train/ActionL1Loss=0.0354
+ throughput/total_tokens=848,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4422/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=849,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4423/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=849,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4424/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=849,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4425/500000]
+ train/ActionL1Loss=0.0508
+ throughput/total_tokens=849,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4426/500000]
+ train/ActionL1Loss=0.0398
+ throughput/total_tokens=849,792,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4427/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=849,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4428/500000]
+ train/ActionL1Loss=0.0376
+ throughput/total_tokens=850,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4429/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=850,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4430/500000]
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=850,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4431/500000]
+ train/ActionL1Loss=0.0483
+ throughput/total_tokens=850,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4432/500000]
+ train/ActionL1Loss=0.0398
+ throughput/total_tokens=850,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4433/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=851,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4434/500000]
+ train/ActionL1Loss=0.0357
+ throughput/total_tokens=851,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4435/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=851,520,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4436/500000]
+ train/ActionL1Loss=0.0505
+ throughput/total_tokens=851,712,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4437/500000]
+ train/ActionL1Loss=0.0388
+ throughput/total_tokens=851,904,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4438/500000]
+ train/ActionL1Loss=0.0385
+ throughput/total_tokens=852,096,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4439/500000]
+ train/ActionL1Loss=0.0336
+ throughput/total_tokens=852,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4440/500000]
+ optim/total_grad_norm=10.13
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=852,480,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4441/500000]
+ train/ActionL1Loss=0.0399
+ throughput/total_tokens=852,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4442/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=852,864,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4443/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=853,056,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4444/500000]
+ train/ActionL1Loss=0.0424
+ throughput/total_tokens=853,248,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4445/500000]
+ train/ActionL1Loss=0.0361
+ throughput/total_tokens=853,440,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4446/500000]
+ train/ActionL1Loss=0.0371
+ throughput/total_tokens=853,632,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4447/500000]
+ train/ActionL1Loss=0.0426
+ throughput/total_tokens=853,824,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4448/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=854,016,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4449/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=854,208,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4450/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=854,400,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4451/500000]
+ train/ActionL1Loss=0.0440
+ throughput/total_tokens=854,592,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4452/500000]
+ train/ActionL1Loss=0.0369
+ throughput/total_tokens=854,784,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4453/500000]
+ train/ActionL1Loss=0.0567
+ throughput/total_tokens=854,976,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4454/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=855,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4455/500000]
+ train/ActionL1Loss=0.0409
+ throughput/total_tokens=855,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4456/500000]
+ train/ActionL1Loss=0.0369
+ throughput/total_tokens=855,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4457/500000]
+ train/ActionL1Loss=0.0405
+ throughput/total_tokens=855,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4458/500000]
+ train/ActionL1Loss=0.0412
+ throughput/total_tokens=855,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4459/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=856,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4460/500000]
+ optim/total_grad_norm=7.311
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=856,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4461/500000]
+ train/ActionL1Loss=0.0436
+ throughput/total_tokens=856,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4462/500000]
+ train/ActionL1Loss=0.0366
+ throughput/total_tokens=856,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4463/500000]
+ train/ActionL1Loss=0.0457
+ throughput/total_tokens=856,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4464/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=857,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4465/500000]
+ train/ActionL1Loss=0.0470
+ throughput/total_tokens=857,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4466/500000]
+ train/ActionL1Loss=0.0433
+ throughput/total_tokens=857,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4467/500000]
+ train/ActionL1Loss=0.0362
+ throughput/total_tokens=857,664,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4468/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=857,856,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4469/500000]
+ train/ActionL1Loss=0.0372
+ throughput/total_tokens=858,048,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4470/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=858,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4471/500000]
+ train/ActionL1Loss=0.0413
+ throughput/total_tokens=858,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4472/500000]
+ train/ActionL1Loss=0.0347
+ throughput/total_tokens=858,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4473/500000]
+ train/ActionL1Loss=0.0356
+ throughput/total_tokens=858,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4474/500000]
+ train/ActionL1Loss=0.0355
+ throughput/total_tokens=859,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4475/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=859,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4476/500000]
+ train/ActionL1Loss=0.0387
+ throughput/total_tokens=859,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4477/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=859,584,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4478/500000]
+ train/ActionL1Loss=0.0468
+ throughput/total_tokens=859,776,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4479/500000]
+ train/ActionL1Loss=0.0540
+ throughput/total_tokens=859,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4480/500000]
+ optim/total_grad_norm=7.753
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=860,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4481/500000]
+ train/ActionL1Loss=0.0419
+ throughput/total_tokens=860,352,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4482/500000]
+ train/ActionL1Loss=0.0427
+ throughput/total_tokens=860,544,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4483/500000]
+ train/ActionL1Loss=0.0453
+ throughput/total_tokens=860,736,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4484/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=860,928,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4485/500000]
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=861,120,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4486/500000]
+ train/ActionL1Loss=0.0416
+ throughput/total_tokens=861,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4487/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=861,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4488/500000]
+ train/ActionL1Loss=0.0359
+ throughput/total_tokens=861,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4489/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=861,888,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4490/500000]
+ train/ActionL1Loss=0.0323
+ throughput/total_tokens=862,080,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4491/500000]
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=862,272,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4492/500000]
+ train/ActionL1Loss=0.0355
+ throughput/total_tokens=862,464,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4493/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=862,656,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4494/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=862,848,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4495/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=863,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4496/500000]
+ train/ActionL1Loss=0.0374
+ throughput/total_tokens=863,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4497/500000]
+ train/ActionL1Loss=0.0398
+ throughput/total_tokens=863,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4498/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=863,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4499/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=863,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4500/500000]
+ optim/total_grad_norm=9.513
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=864,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+10/03 [18:37:40] INFO | >> Saving config... checkpoint.py:608
+10/03 [18:38:30] INFO | >> Saving model state... checkpoint.py:796
+10/03 [18:39:41] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [18:41:11] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=4501/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=864,192,000
+ throughput/device/tokens_per_second=1,225
+ throughput/device/batches_per_second=0.0510
+[step=4502/500000]
+ train/ActionL1Loss=0.0461
+ throughput/total_tokens=864,384,000
+ throughput/device/tokens_per_second=1,203
+ throughput/device/batches_per_second=0.0502
+[step=4503/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=864,576,000
+ throughput/device/tokens_per_second=1,195
+ throughput/device/batches_per_second=0.0498
+[step=4504/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=864,768,000
+ throughput/device/tokens_per_second=1,191
+ throughput/device/batches_per_second=0.0496
+[step=4505/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=864,960,000
+ throughput/device/tokens_per_second=1,190
+ throughput/device/batches_per_second=0.0496
+[step=4506/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=865,152,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4507/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=865,344,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4508/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=865,536,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4509/500000]
+ train/ActionL1Loss=0.0401
+ throughput/total_tokens=865,728,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4510/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=865,920,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=4511/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=866,112,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4512/500000]
+ train/ActionL1Loss=0.0402
+ throughput/total_tokens=866,304,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4513/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=866,496,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4514/500000]
+ train/ActionL1Loss=0.0392
+ throughput/total_tokens=866,688,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4515/500000]
+ train/ActionL1Loss=0.0422
+ throughput/total_tokens=866,880,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4516/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=867,072,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4517/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=867,264,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4518/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=867,456,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4519/500000]
+ train/ActionL1Loss=0.0530
+ throughput/total_tokens=867,648,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4520/500000]
+ optim/total_grad_norm=8.902
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=867,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4521/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=868,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4522/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=868,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4523/500000]
+ train/ActionL1Loss=0.0845
+ throughput/total_tokens=868,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4524/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=868,608,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4525/500000]
+ train/ActionL1Loss=0.0398
+ throughput/total_tokens=868,800,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4526/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=868,992,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4527/500000]
+ train/ActionL1Loss=0.0347
+ throughput/total_tokens=869,184,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4528/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=869,376,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4529/500000]
+ train/ActionL1Loss=0.0355
+ throughput/total_tokens=869,568,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4530/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=869,760,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4531/500000]
+ train/ActionL1Loss=0.0421
+ throughput/total_tokens=869,952,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4532/500000]
+ train/ActionL1Loss=0.0379
+ throughput/total_tokens=870,144,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4533/500000]
+ train/ActionL1Loss=0.0381
+ throughput/total_tokens=870,336,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4534/500000]
+ train/ActionL1Loss=0.1372
+ throughput/total_tokens=870,528,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4535/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=870,720,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4536/500000]
+ train/ActionL1Loss=0.0441
+ throughput/total_tokens=870,912,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4537/500000]
+ train/ActionL1Loss=0.0464
+ throughput/total_tokens=871,104,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4538/500000]
+ train/ActionL1Loss=0.0466
+ throughput/total_tokens=871,296,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4539/500000]
+ train/ActionL1Loss=0.0439
+ throughput/total_tokens=871,488,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4540/500000]
+ optim/total_grad_norm=8.822
+ train/ActionL1Loss=0.0416
+ throughput/total_tokens=871,680,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4541/500000]
+ train/ActionL1Loss=0.0501
+ throughput/total_tokens=871,872,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4542/500000]
+ train/ActionL1Loss=0.0422
+ throughput/total_tokens=872,064,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4543/500000]
+ train/ActionL1Loss=0.0365
+ throughput/total_tokens=872,256,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4544/500000]
+ train/ActionL1Loss=0.0528
+ throughput/total_tokens=872,448,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4545/500000]
+ train/ActionL1Loss=0.0445
+ throughput/total_tokens=872,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4546/500000]
+ train/ActionL1Loss=0.0432
+ throughput/total_tokens=872,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4547/500000]
+ train/ActionL1Loss=0.0431
+ throughput/total_tokens=873,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4548/500000]
+ train/ActionL1Loss=0.0472
+ throughput/total_tokens=873,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4549/500000]
+ train/ActionL1Loss=0.0427
+ throughput/total_tokens=873,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4550/500000]
+ train/ActionL1Loss=0.0448
+ throughput/total_tokens=873,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4551/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=873,792,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4552/500000]
+ train/ActionL1Loss=0.0372
+ throughput/total_tokens=873,984,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4553/500000]
+ train/ActionL1Loss=0.0393
+ throughput/total_tokens=874,176,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4554/500000]
+ train/ActionL1Loss=0.0372
+ throughput/total_tokens=874,368,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4555/500000]
+ train/ActionL1Loss=0.0413
+ throughput/total_tokens=874,560,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4556/500000]
+ train/ActionL1Loss=0.0402
+ throughput/total_tokens=874,752,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4557/500000]
+ train/ActionL1Loss=0.0473
+ throughput/total_tokens=874,944,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4558/500000]
+ train/ActionL1Loss=0.0424
+ throughput/total_tokens=875,136,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=4559/500000]
+ train/ActionL1Loss=0.0405
+ throughput/total_tokens=875,328,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=4560/500000]
+ optim/total_grad_norm=8.411
+ train/ActionL1Loss=0.0441
+ throughput/total_tokens=875,520,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=4561/500000]
+ train/ActionL1Loss=0.0368
+ throughput/total_tokens=875,712,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=4562/500000]
+ train/ActionL1Loss=0.0425
+ throughput/total_tokens=875,904,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=4563/500000]
+ train/ActionL1Loss=0.0423
+ throughput/total_tokens=876,096,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=4564/500000]
+ train/ActionL1Loss=0.0407
+ throughput/total_tokens=876,288,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=4565/500000]
+ train/ActionL1Loss=0.0451
+ throughput/total_tokens=876,480,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=4566/500000]
+ train/ActionL1Loss=0.0454
+ throughput/total_tokens=876,672,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4567/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=876,864,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4568/500000]
+ train/ActionL1Loss=0.0601
+ throughput/total_tokens=877,056,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4569/500000]
+ train/ActionL1Loss=0.0438
+ throughput/total_tokens=877,248,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4570/500000]
+ train/ActionL1Loss=0.0402
+ throughput/total_tokens=877,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4571/500000]
+ train/ActionL1Loss=0.0455
+ throughput/total_tokens=877,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4572/500000]
+ train/ActionL1Loss=0.0456
+ throughput/total_tokens=877,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4573/500000]
+ train/ActionL1Loss=0.0515
+ throughput/total_tokens=878,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4574/500000]
+ train/ActionL1Loss=0.0393
+ throughput/total_tokens=878,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4575/500000]
+ train/ActionL1Loss=0.0427
+ throughput/total_tokens=878,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4576/500000]
+ train/ActionL1Loss=0.0573
+ throughput/total_tokens=878,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4577/500000]
+ train/ActionL1Loss=0.0407
+ throughput/total_tokens=878,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4578/500000]
+ train/ActionL1Loss=0.0355
+ throughput/total_tokens=878,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4579/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=879,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4580/500000]
+ optim/total_grad_norm=6.240
+ train/ActionL1Loss=0.0419
+ throughput/total_tokens=879,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4581/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=879,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4582/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=879,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4583/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=879,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4584/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=880,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4585/500000]
+ train/ActionL1Loss=0.0445
+ throughput/total_tokens=880,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4586/500000]
+ train/ActionL1Loss=0.0337
+ throughput/total_tokens=880,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4587/500000]
+ train/ActionL1Loss=0.0435
+ throughput/total_tokens=880,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4588/500000]
+ train/ActionL1Loss=0.0484
+ throughput/total_tokens=880,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4589/500000]
+ train/ActionL1Loss=0.0480
+ throughput/total_tokens=881,088,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4590/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=881,280,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4591/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=881,472,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4592/500000]
+ train/ActionL1Loss=0.0404
+ throughput/total_tokens=881,664,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4593/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=881,856,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4594/500000]
+ train/ActionL1Loss=0.0372
+ throughput/total_tokens=882,048,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4595/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=882,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4596/500000]
+ train/ActionL1Loss=0.0368
+ throughput/total_tokens=882,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4597/500000]
+ train/ActionL1Loss=0.0442
+ throughput/total_tokens=882,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4598/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=882,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4599/500000]
+ train/ActionL1Loss=0.0490
+ throughput/total_tokens=883,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4600/500000]
+ optim/total_grad_norm=8.333
+ train/ActionL1Loss=0.0575
+ throughput/total_tokens=883,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4601/500000]
+ train/ActionL1Loss=0.0331
+ throughput/total_tokens=883,392,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4602/500000]
+ train/ActionL1Loss=0.0505
+ throughput/total_tokens=883,584,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4603/500000]
+ train/ActionL1Loss=0.0414
+ throughput/total_tokens=883,776,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4604/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=883,968,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4605/500000]
+ train/ActionL1Loss=0.0376
+ throughput/total_tokens=884,160,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4606/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=884,352,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4607/500000]
+ train/ActionL1Loss=0.0516
+ throughput/total_tokens=884,544,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4608/500000]
+ train/ActionL1Loss=0.0356
+ throughput/total_tokens=884,736,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4609/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=884,928,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4610/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=885,120,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4611/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=885,312,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4612/500000]
+ train/ActionL1Loss=0.0473
+ throughput/total_tokens=885,504,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4613/500000]
+ train/ActionL1Loss=0.0409
+ throughput/total_tokens=885,696,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4614/500000]
+ train/ActionL1Loss=0.0365
+ throughput/total_tokens=885,888,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4615/500000]
+ train/ActionL1Loss=0.0362
+ throughput/total_tokens=886,080,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4616/500000]
+ train/ActionL1Loss=0.0426
+ throughput/total_tokens=886,272,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4617/500000]
+ train/ActionL1Loss=0.0433
+ throughput/total_tokens=886,464,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4618/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=886,656,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4619/500000]
+ train/ActionL1Loss=0.0358
+ throughput/total_tokens=886,848,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4620/500000]
+ optim/total_grad_norm=9.144
+ train/ActionL1Loss=0.0528
+ throughput/total_tokens=887,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4621/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=887,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4622/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=887,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4623/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=887,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4624/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=887,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4625/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=888,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4626/500000]
+ train/ActionL1Loss=0.0387
+ throughput/total_tokens=888,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4627/500000]
+ train/ActionL1Loss=0.0398
+ throughput/total_tokens=888,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4628/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=888,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4629/500000]
+ train/ActionL1Loss=0.0485
+ throughput/total_tokens=888,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4630/500000]
+ train/ActionL1Loss=0.0465
+ throughput/total_tokens=888,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4631/500000]
+ train/ActionL1Loss=0.0454
+ throughput/total_tokens=889,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4632/500000]
+ train/ActionL1Loss=0.0399
+ throughput/total_tokens=889,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4633/500000]
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=889,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4634/500000]
+ train/ActionL1Loss=0.0421
+ throughput/total_tokens=889,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4635/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=889,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4636/500000]
+ train/ActionL1Loss=0.0340
+ throughput/total_tokens=890,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4637/500000]
+ train/ActionL1Loss=0.0650
+ throughput/total_tokens=890,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4638/500000]
+ train/ActionL1Loss=0.0418
+ throughput/total_tokens=890,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4639/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=890,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4640/500000]
+ optim/total_grad_norm=8.682
+ train/ActionL1Loss=0.0522
+ throughput/total_tokens=890,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4641/500000]
+ train/ActionL1Loss=0.0363
+ throughput/total_tokens=891,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4642/500000]
+ train/ActionL1Loss=0.0574
+ throughput/total_tokens=891,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4643/500000]
+ train/ActionL1Loss=0.0495
+ throughput/total_tokens=891,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4644/500000]
+ train/ActionL1Loss=0.0434
+ throughput/total_tokens=891,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4645/500000]
+ train/ActionL1Loss=0.0378
+ throughput/total_tokens=891,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4646/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=892,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4647/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=892,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4648/500000]
+ train/ActionL1Loss=0.0369
+ throughput/total_tokens=892,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4649/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=892,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4650/500000]
+ train/ActionL1Loss=0.0530
+ throughput/total_tokens=892,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4651/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=892,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4652/500000]
+ train/ActionL1Loss=0.0525
+ throughput/total_tokens=893,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4653/500000]
+ train/ActionL1Loss=0.0476
+ throughput/total_tokens=893,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4654/500000]
+ train/ActionL1Loss=0.0371
+ throughput/total_tokens=893,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4655/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=893,760,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4656/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=893,952,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4657/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=894,144,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4658/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=894,336,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4659/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=894,528,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4660/500000]
+ optim/total_grad_norm=7.490
+ train/ActionL1Loss=0.0429
+ throughput/total_tokens=894,720,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4661/500000]
+ train/ActionL1Loss=0.0475
+ throughput/total_tokens=894,912,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4662/500000]
+ train/ActionL1Loss=0.0416
+ throughput/total_tokens=895,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4663/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=895,296,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4664/500000]
+ train/ActionL1Loss=0.0479
+ throughput/total_tokens=895,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4665/500000]
+ train/ActionL1Loss=0.0491
+ throughput/total_tokens=895,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4666/500000]
+ train/ActionL1Loss=0.0499
+ throughput/total_tokens=895,872,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4667/500000]
+ train/ActionL1Loss=0.0445
+ throughput/total_tokens=896,064,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4668/500000]
+ train/ActionL1Loss=0.0436
+ throughput/total_tokens=896,256,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4669/500000]
+ train/ActionL1Loss=0.0399
+ throughput/total_tokens=896,448,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4670/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=896,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4671/500000]
+ train/ActionL1Loss=0.0418
+ throughput/total_tokens=896,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4672/500000]
+ train/ActionL1Loss=0.0371
+ throughput/total_tokens=897,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4673/500000]
+ train/ActionL1Loss=0.0376
+ throughput/total_tokens=897,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4674/500000]
+ train/ActionL1Loss=0.0459
+ throughput/total_tokens=897,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4675/500000]
+ train/ActionL1Loss=0.0392
+ throughput/total_tokens=897,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4676/500000]
+ train/ActionL1Loss=0.0394
+ throughput/total_tokens=897,792,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=4677/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=897,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4678/500000]
+ train/ActionL1Loss=0.0383
+ throughput/total_tokens=898,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4679/500000]
+ train/ActionL1Loss=0.0402
+ throughput/total_tokens=898,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4680/500000]
+ optim/total_grad_norm=7.890
+ train/ActionL1Loss=0.0591
+ throughput/total_tokens=898,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4681/500000]
+ train/ActionL1Loss=0.0399
+ throughput/total_tokens=898,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4682/500000]
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=898,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4683/500000]
+ train/ActionL1Loss=0.0396
+ throughput/total_tokens=899,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4684/500000]
+ train/ActionL1Loss=0.0425
+ throughput/total_tokens=899,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4685/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=899,520,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4686/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=899,712,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4687/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=899,904,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4688/500000]
+ train/ActionL1Loss=0.0473
+ throughput/total_tokens=900,096,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4689/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=900,288,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4690/500000]
+ train/ActionL1Loss=0.0501
+ throughput/total_tokens=900,480,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=4691/500000]
+ train/ActionL1Loss=0.0431
+ throughput/total_tokens=900,672,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4692/500000]
+ train/ActionL1Loss=0.0398
+ throughput/total_tokens=900,864,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4693/500000]
+ train/ActionL1Loss=0.0569
+ throughput/total_tokens=901,056,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4694/500000]
+ train/ActionL1Loss=0.0541
+ throughput/total_tokens=901,248,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4695/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=901,440,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4696/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=901,632,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4697/500000]
+ train/ActionL1Loss=0.0407
+ throughput/total_tokens=901,824,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4698/500000]
+ train/ActionL1Loss=0.0456
+ throughput/total_tokens=902,016,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4699/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=902,208,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4700/500000]
+ optim/total_grad_norm=7.055
+ train/ActionL1Loss=0.0402
+ throughput/total_tokens=902,400,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4701/500000]
+ train/ActionL1Loss=0.0457
+ throughput/total_tokens=902,592,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4702/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=902,784,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4703/500000]
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=902,976,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4704/500000]
+ train/ActionL1Loss=0.0449
+ throughput/total_tokens=903,168,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4705/500000]
+ train/ActionL1Loss=0.0361
+ throughput/total_tokens=903,360,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4706/500000]
+ train/ActionL1Loss=0.0430
+ throughput/total_tokens=903,552,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4707/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=903,744,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4708/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=903,936,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4709/500000]
+ train/ActionL1Loss=0.0430
+ throughput/total_tokens=904,128,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4710/500000]
+ train/ActionL1Loss=0.0421
+ throughput/total_tokens=904,320,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4711/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=904,512,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4712/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=904,704,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4713/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=904,896,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4714/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=905,088,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4715/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=905,280,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4716/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=905,472,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4717/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=905,664,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4718/500000]
+ train/ActionL1Loss=0.0411
+ throughput/total_tokens=905,856,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4719/500000]
+ train/ActionL1Loss=0.0362
+ throughput/total_tokens=906,048,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4720/500000]
+ optim/total_grad_norm=7.844
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=906,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4721/500000]
+ train/ActionL1Loss=0.0431
+ throughput/total_tokens=906,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4722/500000]
+ train/ActionL1Loss=0.0459
+ throughput/total_tokens=906,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4723/500000]
+ train/ActionL1Loss=0.0399
+ throughput/total_tokens=906,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4724/500000]
+ train/ActionL1Loss=0.0336
+ throughput/total_tokens=907,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4725/500000]
+ train/ActionL1Loss=0.0337
+ throughput/total_tokens=907,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4726/500000]
+ train/ActionL1Loss=0.0446
+ throughput/total_tokens=907,392,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4727/500000]
+ train/ActionL1Loss=0.0376
+ throughput/total_tokens=907,584,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4728/500000]
+ train/ActionL1Loss=0.0414
+ throughput/total_tokens=907,776,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4729/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=907,968,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4730/500000]
+ train/ActionL1Loss=0.0374
+ throughput/total_tokens=908,160,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=4731/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=908,352,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4732/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=908,544,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4733/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=908,736,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4734/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=908,928,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4735/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=909,120,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4736/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=909,312,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4737/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=909,504,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4738/500000]
+ train/ActionL1Loss=0.0460
+ throughput/total_tokens=909,696,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4739/500000]
+ train/ActionL1Loss=0.0410
+ throughput/total_tokens=909,888,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4740/500000]
+ optim/total_grad_norm=9.139
+ train/ActionL1Loss=0.0475
+ throughput/total_tokens=910,080,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=4741/500000]
+ train/ActionL1Loss=0.0474
+ throughput/total_tokens=910,272,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4742/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=910,464,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4743/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=910,656,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4744/500000]
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=910,848,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4745/500000]
+ train/ActionL1Loss=0.0410
+ throughput/total_tokens=911,040,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4746/500000]
+ train/ActionL1Loss=0.0411
+ throughput/total_tokens=911,232,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4747/500000]
+ train/ActionL1Loss=0.0391
+ throughput/total_tokens=911,424,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4748/500000]
+ train/ActionL1Loss=0.0366
+ throughput/total_tokens=911,616,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4749/500000]
+ train/ActionL1Loss=0.0534
+ throughput/total_tokens=911,808,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4750/500000]
+ train/ActionL1Loss=0.0390
+ throughput/total_tokens=912,000,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=4751/500000]
+ train/ActionL1Loss=0.0340
+ throughput/total_tokens=912,192,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4752/500000]
+ train/ActionL1Loss=0.0455
+ throughput/total_tokens=912,384,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4753/500000]
+ train/ActionL1Loss=0.0339
+ throughput/total_tokens=912,576,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4754/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=912,768,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4755/500000]
+ train/ActionL1Loss=0.0493
+ throughput/total_tokens=912,960,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4756/500000]
+ train/ActionL1Loss=0.0459
+ throughput/total_tokens=913,152,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4757/500000]
+ train/ActionL1Loss=0.0417
+ throughput/total_tokens=913,344,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4758/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=913,536,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4759/500000]
+ train/ActionL1Loss=0.0435
+ throughput/total_tokens=913,728,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4760/500000]
+ optim/total_grad_norm=7.962
+ train/ActionL1Loss=0.0378
+ throughput/total_tokens=913,920,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4761/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=914,112,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4762/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=914,304,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4763/500000]
+ train/ActionL1Loss=0.0421
+ throughput/total_tokens=914,496,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4764/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=914,688,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4765/500000]
+ train/ActionL1Loss=0.0355
+ throughput/total_tokens=914,880,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4766/500000]
+ train/ActionL1Loss=0.0377
+ throughput/total_tokens=915,072,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4767/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=915,264,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4768/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=915,456,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4769/500000]
+ train/ActionL1Loss=0.0442
+ throughput/total_tokens=915,648,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4770/500000]
+ train/ActionL1Loss=0.0421
+ throughput/total_tokens=915,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4771/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=916,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4772/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=916,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4773/500000]
+ train/ActionL1Loss=0.0381
+ throughput/total_tokens=916,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4774/500000]
+ train/ActionL1Loss=0.0372
+ throughput/total_tokens=916,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4775/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=916,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4776/500000]
+ train/ActionL1Loss=0.0414
+ throughput/total_tokens=916,992,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4777/500000]
+ train/ActionL1Loss=0.0362
+ throughput/total_tokens=917,184,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4778/500000]
+ train/ActionL1Loss=0.0392
+ throughput/total_tokens=917,376,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4779/500000]
+ train/ActionL1Loss=0.0383
+ throughput/total_tokens=917,568,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4780/500000]
+ optim/total_grad_norm=9.220
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=917,760,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4781/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=917,952,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4782/500000]
+ train/ActionL1Loss=0.0393
+ throughput/total_tokens=918,144,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4783/500000]
+ train/ActionL1Loss=0.0368
+ throughput/total_tokens=918,336,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4784/500000]
+ train/ActionL1Loss=0.0460
+ throughput/total_tokens=918,528,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4785/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=918,720,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4786/500000]
+ train/ActionL1Loss=0.0576
+ throughput/total_tokens=918,912,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4787/500000]
+ train/ActionL1Loss=0.0443
+ throughput/total_tokens=919,104,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4788/500000]
+ train/ActionL1Loss=0.0368
+ throughput/total_tokens=919,296,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4789/500000]
+ train/ActionL1Loss=0.0554
+ throughput/total_tokens=919,488,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=4790/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=919,680,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=4791/500000]
+ train/ActionL1Loss=0.0402
+ throughput/total_tokens=919,872,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4792/500000]
+ train/ActionL1Loss=0.0359
+ throughput/total_tokens=920,064,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4793/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=920,256,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4794/500000]
+ train/ActionL1Loss=0.0472
+ throughput/total_tokens=920,448,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4795/500000]
+ train/ActionL1Loss=0.0580
+ throughput/total_tokens=920,640,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4796/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=920,832,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4797/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=921,024,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4798/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=921,216,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=4799/500000]
+ train/ActionL1Loss=0.0405
+ throughput/total_tokens=921,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4800/500000]
+ optim/total_grad_norm=6.949
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=921,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4801/500000]
+ train/ActionL1Loss=0.0347
+ throughput/total_tokens=921,792,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4802/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=921,984,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4803/500000]
+ train/ActionL1Loss=0.0398
+ throughput/total_tokens=922,176,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4804/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=922,368,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4805/500000]
+ train/ActionL1Loss=0.0337
+ throughput/total_tokens=922,560,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4806/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=922,752,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4807/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=922,944,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4808/500000]
+ train/ActionL1Loss=0.0388
+ throughput/total_tokens=923,136,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4809/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=923,328,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4810/500000]
+ train/ActionL1Loss=0.0473
+ throughput/total_tokens=923,520,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4811/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=923,712,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4812/500000]
+ train/ActionL1Loss=0.0435
+ throughput/total_tokens=923,904,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4813/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=924,096,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4814/500000]
+ train/ActionL1Loss=0.0374
+ throughput/total_tokens=924,288,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4815/500000]
+ train/ActionL1Loss=0.0337
+ throughput/total_tokens=924,480,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4816/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=924,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4817/500000]
+ train/ActionL1Loss=0.0449
+ throughput/total_tokens=924,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4818/500000]
+ train/ActionL1Loss=0.0395
+ throughput/total_tokens=925,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4819/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=925,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4820/500000]
+ optim/total_grad_norm=7.216
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=925,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4821/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=925,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4822/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=925,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4823/500000]
+ train/ActionL1Loss=0.0386
+ throughput/total_tokens=926,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4824/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=926,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4825/500000]
+ train/ActionL1Loss=0.0395
+ throughput/total_tokens=926,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4826/500000]
+ train/ActionL1Loss=0.0390
+ throughput/total_tokens=926,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4827/500000]
+ train/ActionL1Loss=0.0376
+ throughput/total_tokens=926,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4828/500000]
+ train/ActionL1Loss=0.0458
+ throughput/total_tokens=926,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4829/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=927,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4830/500000]
+ train/ActionL1Loss=0.0416
+ throughput/total_tokens=927,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4831/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=927,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4832/500000]
+ train/ActionL1Loss=0.0358
+ throughput/total_tokens=927,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4833/500000]
+ train/ActionL1Loss=0.0377
+ throughput/total_tokens=927,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4834/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=928,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4835/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=928,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4836/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=928,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4837/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=928,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4838/500000]
+ train/ActionL1Loss=0.0390
+ throughput/total_tokens=928,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4839/500000]
+ train/ActionL1Loss=0.0358
+ throughput/total_tokens=929,088,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4840/500000]
+ optim/total_grad_norm=8.865
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=929,280,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4841/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=929,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4842/500000]
+ train/ActionL1Loss=0.0378
+ throughput/total_tokens=929,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4843/500000]
+ train/ActionL1Loss=0.0358
+ throughput/total_tokens=929,856,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4844/500000]
+ train/ActionL1Loss=0.0427
+ throughput/total_tokens=930,048,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4845/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=930,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4846/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=930,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4847/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=930,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4848/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=930,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4849/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=931,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4850/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=931,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4851/500000]
+ train/ActionL1Loss=0.0385
+ throughput/total_tokens=931,392,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4852/500000]
+ train/ActionL1Loss=0.0332
+ throughput/total_tokens=931,584,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4853/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=931,776,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4854/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=931,968,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4855/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=932,160,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4856/500000]
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=932,352,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4857/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=932,544,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4858/500000]
+ train/ActionL1Loss=0.0362
+ throughput/total_tokens=932,736,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4859/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=932,928,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4860/500000]
+ optim/total_grad_norm=8.382
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=933,120,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4861/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=933,312,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4862/500000]
+ train/ActionL1Loss=0.0331
+ throughput/total_tokens=933,504,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4863/500000]
+ train/ActionL1Loss=0.0501
+ throughput/total_tokens=933,696,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4864/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=933,888,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4865/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=934,080,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4866/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=934,272,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4867/500000]
+ train/ActionL1Loss=0.0405
+ throughput/total_tokens=934,464,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4868/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=934,656,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4869/500000]
+ train/ActionL1Loss=0.0399
+ throughput/total_tokens=934,848,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4870/500000]
+ train/ActionL1Loss=0.0385
+ throughput/total_tokens=935,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4871/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=935,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4872/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=935,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4873/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=935,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4874/500000]
+ train/ActionL1Loss=0.0374
+ throughput/total_tokens=935,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4875/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=936,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4876/500000]
+ train/ActionL1Loss=0.0355
+ throughput/total_tokens=936,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4877/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=936,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4878/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=936,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4879/500000]
+ train/ActionL1Loss=0.0402
+ throughput/total_tokens=936,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4880/500000]
+ optim/total_grad_norm=7.247
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=936,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4881/500000]
+ train/ActionL1Loss=0.0370
+ throughput/total_tokens=937,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4882/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=937,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4883/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=937,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4884/500000]
+ train/ActionL1Loss=0.0399
+ throughput/total_tokens=937,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4885/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=937,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4886/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=938,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4887/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=938,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4888/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=938,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4889/500000]
+ train/ActionL1Loss=0.0377
+ throughput/total_tokens=938,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4890/500000]
+ train/ActionL1Loss=0.0407
+ throughput/total_tokens=938,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4891/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=939,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4892/500000]
+ train/ActionL1Loss=0.0419
+ throughput/total_tokens=939,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4893/500000]
+ train/ActionL1Loss=0.0459
+ throughput/total_tokens=939,456,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4894/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=939,648,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4895/500000]
+ train/ActionL1Loss=0.0402
+ throughput/total_tokens=939,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4896/500000]
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=940,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4897/500000]
+ train/ActionL1Loss=0.0374
+ throughput/total_tokens=940,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4898/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=940,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4899/500000]
+ train/ActionL1Loss=0.0413
+ throughput/total_tokens=940,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4900/500000]
+ optim/total_grad_norm=9.292
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=940,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4901/500000]
+ train/ActionL1Loss=0.0388
+ throughput/total_tokens=940,992,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4902/500000]
+ train/ActionL1Loss=0.0386
+ throughput/total_tokens=941,184,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4903/500000]
+ train/ActionL1Loss=0.0358
+ throughput/total_tokens=941,376,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4904/500000]
+ train/ActionL1Loss=0.0414
+ throughput/total_tokens=941,568,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4905/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=941,760,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4906/500000]
+ train/ActionL1Loss=0.0544
+ throughput/total_tokens=941,952,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4907/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=942,144,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4908/500000]
+ train/ActionL1Loss=0.0425
+ throughput/total_tokens=942,336,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4909/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=942,528,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4910/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=942,720,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4911/500000]
+ train/ActionL1Loss=0.0385
+ throughput/total_tokens=942,912,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4912/500000]
+ train/ActionL1Loss=0.0456
+ throughput/total_tokens=943,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4913/500000]
+ train/ActionL1Loss=0.0454
+ throughput/total_tokens=943,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4914/500000]
+ train/ActionL1Loss=0.0390
+ throughput/total_tokens=943,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4915/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=943,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4916/500000]
+ train/ActionL1Loss=0.0368
+ throughput/total_tokens=943,872,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4917/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=944,064,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4918/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=944,256,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4919/500000]
+ train/ActionL1Loss=0.0377
+ throughput/total_tokens=944,448,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4920/500000]
+ optim/total_grad_norm=8.591
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=944,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4921/500000]
+ train/ActionL1Loss=0.0439
+ throughput/total_tokens=944,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4922/500000]
+ train/ActionL1Loss=0.0386
+ throughput/total_tokens=945,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4923/500000]
+ train/ActionL1Loss=0.0376
+ throughput/total_tokens=945,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4924/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=945,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4925/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=945,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4926/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=945,792,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4927/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=945,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4928/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=946,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4929/500000]
+ train/ActionL1Loss=0.0340
+ throughput/total_tokens=946,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4930/500000]
+ train/ActionL1Loss=0.0379
+ throughput/total_tokens=946,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4931/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=946,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4932/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=946,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4933/500000]
+ train/ActionL1Loss=0.0395
+ throughput/total_tokens=947,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4934/500000]
+ train/ActionL1Loss=0.0396
+ throughput/total_tokens=947,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4935/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=947,520,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4936/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=947,712,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4937/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=947,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4938/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=948,096,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4939/500000]
+ train/ActionL1Loss=0.0414
+ throughput/total_tokens=948,288,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4940/500000]
+ optim/total_grad_norm=9.035
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=948,480,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4941/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=948,672,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4942/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=948,864,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4943/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=949,056,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4944/500000]
+ train/ActionL1Loss=0.0486
+ throughput/total_tokens=949,248,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4945/500000]
+ train/ActionL1Loss=0.0368
+ throughput/total_tokens=949,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4946/500000]
+ train/ActionL1Loss=0.0383
+ throughput/total_tokens=949,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4947/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=949,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4948/500000]
+ train/ActionL1Loss=0.0384
+ throughput/total_tokens=950,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4949/500000]
+ train/ActionL1Loss=0.0491
+ throughput/total_tokens=950,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=4950/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=950,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4951/500000]
+ train/ActionL1Loss=0.0332
+ throughput/total_tokens=950,592,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4952/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=950,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4953/500000]
+ train/ActionL1Loss=0.0425
+ throughput/total_tokens=950,976,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4954/500000]
+ train/ActionL1Loss=0.0385
+ throughput/total_tokens=951,168,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4955/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=951,360,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=4956/500000]
+ train/ActionL1Loss=0.0417
+ throughput/total_tokens=951,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=4957/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=951,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4958/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=951,936,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4959/500000]
+ train/ActionL1Loss=0.0419
+ throughput/total_tokens=952,128,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4960/500000]
+ optim/total_grad_norm=6.603
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=952,320,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=4961/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=952,512,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4962/500000]
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=952,704,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=4963/500000]
+ train/ActionL1Loss=0.0369
+ throughput/total_tokens=952,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4964/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=953,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4965/500000]
+ train/ActionL1Loss=0.0374
+ throughput/total_tokens=953,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4966/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=953,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4967/500000]
+ train/ActionL1Loss=0.0404
+ throughput/total_tokens=953,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4968/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=953,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4969/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=954,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=4970/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=954,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4971/500000]
+ train/ActionL1Loss=0.0416
+ throughput/total_tokens=954,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4972/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=954,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4973/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=954,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4974/500000]
+ train/ActionL1Loss=0.0323
+ throughput/total_tokens=955,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4975/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=955,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4976/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=955,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4977/500000]
+ train/ActionL1Loss=0.0419
+ throughput/total_tokens=955,584,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4978/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=955,776,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4979/500000]
+ train/ActionL1Loss=0.0376
+ throughput/total_tokens=955,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4980/500000]
+ optim/total_grad_norm=7.506
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=956,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4981/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=956,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4982/500000]
+ train/ActionL1Loss=0.0424
+ throughput/total_tokens=956,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4983/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=956,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4984/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=956,928,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4985/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=957,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4986/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=957,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4987/500000]
+ train/ActionL1Loss=0.0410
+ throughput/total_tokens=957,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4988/500000]
+ train/ActionL1Loss=0.0430
+ throughput/total_tokens=957,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4989/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=957,888,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4990/500000]
+ train/ActionL1Loss=0.0433
+ throughput/total_tokens=958,080,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=4991/500000]
+ train/ActionL1Loss=0.0399
+ throughput/total_tokens=958,272,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4992/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=958,464,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=4993/500000]
+ train/ActionL1Loss=0.0336
+ throughput/total_tokens=958,656,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4994/500000]
+ train/ActionL1Loss=0.0354
+ throughput/total_tokens=958,848,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4995/500000]
+ train/ActionL1Loss=0.0473
+ throughput/total_tokens=959,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4996/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=959,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4997/500000]
+ train/ActionL1Loss=0.0368
+ throughput/total_tokens=959,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4998/500000]
+ train/ActionL1Loss=0.0377
+ throughput/total_tokens=959,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=4999/500000]
+ train/ActionL1Loss=0.0385
+ throughput/total_tokens=959,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5000/500000]
+ optim/total_grad_norm=7.951
+ train/ActionL1Loss=0.0396
+ throughput/total_tokens=960,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+10/03 [21:31:17] INFO | >> Saving config... checkpoint.py:608
+10/03 [21:31:51] INFO | >> Saving model state... checkpoint.py:796
+10/03 [21:33:00] INFO | >> Saving optim state... checkpoint.py:811
+10/03 [21:34:25] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=5001/500000]
+ train/ActionL1Loss=0.0379
+ throughput/total_tokens=960,192,000
+ throughput/device/tokens_per_second=1,218
+ throughput/device/batches_per_second=0.0508
+[step=5002/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=960,384,000
+ throughput/device/tokens_per_second=1,201
+ throughput/device/batches_per_second=0.0501
+[step=5003/500000]
+ train/ActionL1Loss=0.0347
+ throughput/total_tokens=960,576,000
+ throughput/device/tokens_per_second=1,194
+ throughput/device/batches_per_second=0.0498
+[step=5004/500000]
+ train/ActionL1Loss=0.0467
+ throughput/total_tokens=960,768,000
+ throughput/device/tokens_per_second=1,191
+ throughput/device/batches_per_second=0.0496
+[step=5005/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=960,960,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=5006/500000]
+ train/ActionL1Loss=0.0442
+ throughput/total_tokens=961,152,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5007/500000]
+ train/ActionL1Loss=0.0388
+ throughput/total_tokens=961,344,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5008/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=961,536,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5009/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=961,728,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5010/500000]
+ train/ActionL1Loss=0.0362
+ throughput/total_tokens=961,920,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5011/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=962,112,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5012/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=962,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5013/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=962,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5014/500000]
+ train/ActionL1Loss=0.0384
+ throughput/total_tokens=962,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5015/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=962,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5016/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=963,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5017/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=963,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5018/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=963,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5019/500000]
+ train/ActionL1Loss=0.0418
+ throughput/total_tokens=963,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5020/500000]
+ optim/total_grad_norm=8.994
+ train/ActionL1Loss=0.0384
+ throughput/total_tokens=963,840,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5021/500000]
+ train/ActionL1Loss=0.0340
+ throughput/total_tokens=964,032,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5022/500000]
+ train/ActionL1Loss=0.0371
+ throughput/total_tokens=964,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5023/500000]
+ train/ActionL1Loss=0.0336
+ throughput/total_tokens=964,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5024/500000]
+ train/ActionL1Loss=0.0379
+ throughput/total_tokens=964,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5025/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=964,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5026/500000]
+ train/ActionL1Loss=0.0347
+ throughput/total_tokens=964,992,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5027/500000]
+ train/ActionL1Loss=0.0484
+ throughput/total_tokens=965,184,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5028/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=965,376,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5029/500000]
+ train/ActionL1Loss=0.0379
+ throughput/total_tokens=965,568,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5030/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=965,760,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5031/500000]
+ train/ActionL1Loss=0.0371
+ throughput/total_tokens=965,952,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5032/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=966,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5033/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=966,336,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5034/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=966,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5035/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=966,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5036/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=966,912,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5037/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=967,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5038/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=967,296,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5039/500000]
+ train/ActionL1Loss=0.0347
+ throughput/total_tokens=967,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5040/500000]
+ optim/total_grad_norm=8.229
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=967,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5041/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=967,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5042/500000]
+ train/ActionL1Loss=0.0347
+ throughput/total_tokens=968,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5043/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=968,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5044/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=968,448,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5045/500000]
+ train/ActionL1Loss=0.0370
+ throughput/total_tokens=968,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5046/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=968,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5047/500000]
+ train/ActionL1Loss=0.0446
+ throughput/total_tokens=969,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5048/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=969,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5049/500000]
+ train/ActionL1Loss=0.0361
+ throughput/total_tokens=969,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5050/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=969,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5051/500000]
+ train/ActionL1Loss=0.0412
+ throughput/total_tokens=969,792,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5052/500000]
+ train/ActionL1Loss=0.0369
+ throughput/total_tokens=969,984,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5053/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=970,176,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5054/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=970,368,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5055/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=970,560,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5056/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=970,752,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5057/500000]
+ train/ActionL1Loss=0.0414
+ throughput/total_tokens=970,944,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5058/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=971,136,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5059/500000]
+ train/ActionL1Loss=0.0451
+ throughput/total_tokens=971,328,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5060/500000]
+ optim/total_grad_norm=9.090
+ train/ActionL1Loss=0.0385
+ throughput/total_tokens=971,520,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+ System/Peak GPU Memory (MB)=46,917
+[step=5061/500000]
+ train/ActionL1Loss=0.0431
+ throughput/total_tokens=971,712,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5062/500000]
+ train/ActionL1Loss=0.0357
+ throughput/total_tokens=971,904,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5063/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=972,096,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5064/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=972,288,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5065/500000]
+ train/ActionL1Loss=0.0423
+ throughput/total_tokens=972,480,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5066/500000]
+ train/ActionL1Loss=0.0396
+ throughput/total_tokens=972,672,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5067/500000]
+ train/ActionL1Loss=0.0401
+ throughput/total_tokens=972,864,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5068/500000]
+ train/ActionL1Loss=0.0368
+ throughput/total_tokens=973,056,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5069/500000]
+ train/ActionL1Loss=0.0371
+ throughput/total_tokens=973,248,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5070/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=973,440,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=5071/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=973,632,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5072/500000]
+ train/ActionL1Loss=0.0347
+ throughput/total_tokens=973,824,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5073/500000]
+ train/ActionL1Loss=0.0332
+ throughput/total_tokens=974,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5074/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=974,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5075/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=974,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5076/500000]
+ train/ActionL1Loss=0.0366
+ throughput/total_tokens=974,592,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5077/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=974,784,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5078/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=974,976,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5079/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=975,168,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5080/500000]
+ optim/total_grad_norm=7.153
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=975,360,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5081/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=975,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5082/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=975,744,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5083/500000]
+ train/ActionL1Loss=0.0369
+ throughput/total_tokens=975,936,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5084/500000]
+ train/ActionL1Loss=0.0366
+ throughput/total_tokens=976,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5085/500000]
+ train/ActionL1Loss=0.0337
+ throughput/total_tokens=976,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5086/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=976,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5087/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=976,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5088/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=976,896,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5089/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=977,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5090/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=977,280,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5091/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=977,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5092/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=977,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5093/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=977,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5094/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=978,048,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5095/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=978,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5096/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=978,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5097/500000]
+ train/ActionL1Loss=0.0337
+ throughput/total_tokens=978,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5098/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=978,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5099/500000]
+ train/ActionL1Loss=0.0383
+ throughput/total_tokens=979,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5100/500000]
+ optim/total_grad_norm=8.403
+ train/ActionL1Loss=0.0370
+ throughput/total_tokens=979,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5101/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=979,392,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5102/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=979,584,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5103/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=979,776,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5104/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=979,968,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5105/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=980,160,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5106/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=980,352,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5107/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=980,544,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5108/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=980,736,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5109/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=980,928,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5110/500000]
+ train/ActionL1Loss=0.0354
+ throughput/total_tokens=981,120,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5111/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=981,312,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5112/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=981,504,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5113/500000]
+ train/ActionL1Loss=0.0414
+ throughput/total_tokens=981,696,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5114/500000]
+ train/ActionL1Loss=0.0362
+ throughput/total_tokens=981,888,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5115/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=982,080,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5116/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=982,272,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5117/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=982,464,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5118/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=982,656,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5119/500000]
+ train/ActionL1Loss=0.0379
+ throughput/total_tokens=982,848,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5120/500000]
+ optim/total_grad_norm=8.855
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=983,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5121/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=983,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5122/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=983,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5123/500000]
+ train/ActionL1Loss=0.0799
+ throughput/total_tokens=983,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5124/500000]
+ train/ActionL1Loss=0.0391
+ throughput/total_tokens=983,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5125/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=984,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5126/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=984,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5127/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=984,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5128/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=984,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5129/500000]
+ train/ActionL1Loss=0.0337
+ throughput/total_tokens=984,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5130/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=984,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5131/500000]
+ train/ActionL1Loss=0.0395
+ throughput/total_tokens=985,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5132/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=985,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5133/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=985,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5134/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=985,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5135/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=985,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5136/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=986,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5137/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=986,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5138/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=986,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5139/500000]
+ train/ActionL1Loss=0.0361
+ throughput/total_tokens=986,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5140/500000]
+ optim/total_grad_norm=9.875
+ train/ActionL1Loss=0.0417
+ throughput/total_tokens=986,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5141/500000]
+ train/ActionL1Loss=0.0416
+ throughput/total_tokens=987,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5142/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=987,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5143/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=987,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5144/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=987,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5145/500000]
+ train/ActionL1Loss=0.0395
+ throughput/total_tokens=987,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5146/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=988,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5147/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=988,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5148/500000]
+ train/ActionL1Loss=0.0461
+ throughput/total_tokens=988,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5149/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=988,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5150/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=988,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5151/500000]
+ train/ActionL1Loss=0.0419
+ throughput/total_tokens=988,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5152/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=989,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5153/500000]
+ train/ActionL1Loss=0.0414
+ throughput/total_tokens=989,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5154/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=989,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5155/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=989,760,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5156/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=989,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5157/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=990,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5158/500000]
+ train/ActionL1Loss=0.0384
+ throughput/total_tokens=990,336,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5159/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=990,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5160/500000]
+ optim/total_grad_norm=7.175
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=990,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=5161/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=990,912,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5162/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=991,104,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5163/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=991,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5164/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=991,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5165/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=991,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5166/500000]
+ train/ActionL1Loss=0.0378
+ throughput/total_tokens=991,872,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5167/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=992,064,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5168/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=992,256,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5169/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=992,448,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5170/500000]
+ train/ActionL1Loss=0.0372
+ throughput/total_tokens=992,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5171/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=992,832,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5172/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=993,024,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5173/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=993,216,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5174/500000]
+ train/ActionL1Loss=0.0368
+ throughput/total_tokens=993,408,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5175/500000]
+ train/ActionL1Loss=0.0323
+ throughput/total_tokens=993,600,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5176/500000]
+ train/ActionL1Loss=0.0357
+ throughput/total_tokens=993,792,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5177/500000]
+ train/ActionL1Loss=0.0428
+ throughput/total_tokens=993,984,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5178/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=994,176,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5179/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=994,368,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5180/500000]
+ optim/total_grad_norm=8.543
+ train/ActionL1Loss=0.0365
+ throughput/total_tokens=994,560,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5181/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=994,752,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5182/500000]
+ train/ActionL1Loss=0.0363
+ throughput/total_tokens=994,944,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5183/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=995,136,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5184/500000]
+ train/ActionL1Loss=0.0479
+ throughput/total_tokens=995,328,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5185/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=995,520,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5186/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=995,712,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5187/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=995,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5188/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=996,096,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5189/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=996,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5190/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=996,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5191/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=996,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5192/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=996,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5193/500000]
+ train/ActionL1Loss=0.0414
+ throughput/total_tokens=997,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5194/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=997,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5195/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=997,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5196/500000]
+ train/ActionL1Loss=0.0807
+ throughput/total_tokens=997,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5197/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=997,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5198/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=998,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5199/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=998,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5200/500000]
+ optim/total_grad_norm=9.678
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=998,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5201/500000]
+ train/ActionL1Loss=0.0358
+ throughput/total_tokens=998,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5202/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=998,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5203/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=998,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5204/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=999,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5205/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=999,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5206/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=999,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5207/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=999,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5208/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=999,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5209/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,000,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5210/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,000,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5211/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=1,000,512,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5212/500000]
+ train/ActionL1Loss=0.0356
+ throughput/total_tokens=1,000,704,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5213/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,000,896,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5214/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=1,001,088,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5215/500000]
+ train/ActionL1Loss=0.0325
+ throughput/total_tokens=1,001,280,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5216/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,001,472,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5217/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=1,001,664,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5218/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=1,001,856,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5219/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=1,002,048,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5220/500000]
+ optim/total_grad_norm=7.101
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=1,002,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5221/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=1,002,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5222/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=1,002,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5223/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,002,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5224/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,003,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5225/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=1,003,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5226/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=1,003,392,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5227/500000]
+ train/ActionL1Loss=0.0395
+ throughput/total_tokens=1,003,584,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5228/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,003,776,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5229/500000]
+ train/ActionL1Loss=0.0336
+ throughput/total_tokens=1,003,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5230/500000]
+ train/ActionL1Loss=0.0372
+ throughput/total_tokens=1,004,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5231/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,004,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5232/500000]
+ train/ActionL1Loss=0.0358
+ throughput/total_tokens=1,004,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5233/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,004,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5234/500000]
+ train/ActionL1Loss=0.0347
+ throughput/total_tokens=1,004,928,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5235/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,005,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5236/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,005,312,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5237/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=1,005,504,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5238/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=1,005,696,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5239/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,005,888,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5240/500000]
+ optim/total_grad_norm=6.257
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,006,080,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5241/500000]
+ train/ActionL1Loss=0.0331
+ throughput/total_tokens=1,006,272,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5242/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,006,464,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5243/500000]
+ train/ActionL1Loss=0.0371
+ throughput/total_tokens=1,006,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5244/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=1,006,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5245/500000]
+ train/ActionL1Loss=0.0354
+ throughput/total_tokens=1,007,040,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5246/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,007,232,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5247/500000]
+ train/ActionL1Loss=0.0420
+ throughput/total_tokens=1,007,424,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5248/500000]
+ train/ActionL1Loss=0.0399
+ throughput/total_tokens=1,007,616,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5249/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,007,808,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5250/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=1,008,000,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5251/500000]
+ train/ActionL1Loss=0.0394
+ throughput/total_tokens=1,008,192,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5252/500000]
+ train/ActionL1Loss=0.0399
+ throughput/total_tokens=1,008,384,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5253/500000]
+ train/ActionL1Loss=0.0365
+ throughput/total_tokens=1,008,576,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5254/500000]
+ train/ActionL1Loss=0.0446
+ throughput/total_tokens=1,008,768,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5255/500000]
+ train/ActionL1Loss=0.0396
+ throughput/total_tokens=1,008,960,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5256/500000]
+ train/ActionL1Loss=0.0446
+ throughput/total_tokens=1,009,152,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5257/500000]
+ train/ActionL1Loss=0.0401
+ throughput/total_tokens=1,009,344,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5258/500000]
+ train/ActionL1Loss=0.0862
+ throughput/total_tokens=1,009,536,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5259/500000]
+ train/ActionL1Loss=0.0497
+ throughput/total_tokens=1,009,728,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5260/500000]
+ optim/total_grad_norm=8.672
+ train/ActionL1Loss=0.0406
+ throughput/total_tokens=1,009,920,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=5261/500000]
+ train/ActionL1Loss=0.0498
+ throughput/total_tokens=1,010,112,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5262/500000]
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=1,010,304,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5263/500000]
+ train/ActionL1Loss=0.0354
+ throughput/total_tokens=1,010,496,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5264/500000]
+ train/ActionL1Loss=0.0422
+ throughput/total_tokens=1,010,688,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5265/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=1,010,880,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5266/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,011,072,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5267/500000]
+ train/ActionL1Loss=0.0417
+ throughput/total_tokens=1,011,264,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5268/500000]
+ train/ActionL1Loss=0.0371
+ throughput/total_tokens=1,011,456,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5269/500000]
+ train/ActionL1Loss=0.0331
+ throughput/total_tokens=1,011,648,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5270/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=1,011,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5271/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,012,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5272/500000]
+ train/ActionL1Loss=0.0386
+ throughput/total_tokens=1,012,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5273/500000]
+ train/ActionL1Loss=0.0485
+ throughput/total_tokens=1,012,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5274/500000]
+ train/ActionL1Loss=0.0358
+ throughput/total_tokens=1,012,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5275/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=1,012,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5276/500000]
+ train/ActionL1Loss=0.0470
+ throughput/total_tokens=1,012,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5277/500000]
+ train/ActionL1Loss=0.0445
+ throughput/total_tokens=1,013,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5278/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,013,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5279/500000]
+ train/ActionL1Loss=0.0379
+ throughput/total_tokens=1,013,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5280/500000]
+ optim/total_grad_norm=8.851
+ train/ActionL1Loss=0.0420
+ throughput/total_tokens=1,013,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5281/500000]
+ train/ActionL1Loss=0.0419
+ throughput/total_tokens=1,013,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5282/500000]
+ train/ActionL1Loss=0.0336
+ throughput/total_tokens=1,014,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5283/500000]
+ train/ActionL1Loss=0.0463
+ throughput/total_tokens=1,014,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5284/500000]
+ train/ActionL1Loss=0.0363
+ throughput/total_tokens=1,014,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5285/500000]
+ train/ActionL1Loss=0.0479
+ throughput/total_tokens=1,014,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5286/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=1,014,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5287/500000]
+ train/ActionL1Loss=0.0413
+ throughput/total_tokens=1,015,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5288/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=1,015,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5289/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=1,015,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5290/500000]
+ train/ActionL1Loss=0.0379
+ throughput/total_tokens=1,015,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5291/500000]
+ train/ActionL1Loss=0.0384
+ throughput/total_tokens=1,015,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5292/500000]
+ train/ActionL1Loss=0.0401
+ throughput/total_tokens=1,016,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5293/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=1,016,256,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5294/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=1,016,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5295/500000]
+ train/ActionL1Loss=0.0454
+ throughput/total_tokens=1,016,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5296/500000]
+ train/ActionL1Loss=0.0337
+ throughput/total_tokens=1,016,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5297/500000]
+ train/ActionL1Loss=0.0370
+ throughput/total_tokens=1,017,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5298/500000]
+ train/ActionL1Loss=0.0386
+ throughput/total_tokens=1,017,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5299/500000]
+ train/ActionL1Loss=0.0405
+ throughput/total_tokens=1,017,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5300/500000]
+ optim/total_grad_norm=8.850
+ train/ActionL1Loss=0.0340
+ throughput/total_tokens=1,017,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5301/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,017,792,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5302/500000]
+ train/ActionL1Loss=0.0370
+ throughput/total_tokens=1,017,984,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5303/500000]
+ train/ActionL1Loss=0.0411
+ throughput/total_tokens=1,018,176,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5304/500000]
+ train/ActionL1Loss=0.0481
+ throughput/total_tokens=1,018,368,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5305/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=1,018,560,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5306/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,018,752,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5307/500000]
+ train/ActionL1Loss=0.0336
+ throughput/total_tokens=1,018,944,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5308/500000]
+ train/ActionL1Loss=0.0435
+ throughput/total_tokens=1,019,136,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5309/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,019,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5310/500000]
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=1,019,520,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5311/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,019,712,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5312/500000]
+ train/ActionL1Loss=0.0388
+ throughput/total_tokens=1,019,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5313/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=1,020,096,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5314/500000]
+ train/ActionL1Loss=0.0339
+ throughput/total_tokens=1,020,288,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5315/500000]
+ train/ActionL1Loss=0.0392
+ throughput/total_tokens=1,020,480,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5316/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,020,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5317/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=1,020,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5318/500000]
+ train/ActionL1Loss=0.0446
+ throughput/total_tokens=1,021,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5319/500000]
+ train/ActionL1Loss=0.0499
+ throughput/total_tokens=1,021,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5320/500000]
+ optim/total_grad_norm=9.424
+ train/ActionL1Loss=0.0456
+ throughput/total_tokens=1,021,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5321/500000]
+ train/ActionL1Loss=0.0418
+ throughput/total_tokens=1,021,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5322/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=1,021,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5323/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,022,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5324/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=1,022,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5325/500000]
+ train/ActionL1Loss=0.0366
+ throughput/total_tokens=1,022,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5326/500000]
+ train/ActionL1Loss=0.0456
+ throughput/total_tokens=1,022,592,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5327/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=1,022,784,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5328/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=1,022,976,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5329/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,023,168,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5330/500000]
+ train/ActionL1Loss=0.0355
+ throughput/total_tokens=1,023,360,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5331/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=1,023,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5332/500000]
+ train/ActionL1Loss=0.0362
+ throughput/total_tokens=1,023,744,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5333/500000]
+ train/ActionL1Loss=0.0370
+ throughput/total_tokens=1,023,936,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5334/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,024,128,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5335/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,024,320,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5336/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,024,512,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5337/500000]
+ train/ActionL1Loss=0.0381
+ throughput/total_tokens=1,024,704,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5338/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,024,896,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5339/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=1,025,088,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5340/500000]
+ optim/total_grad_norm=6.511
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=1,025,280,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5341/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,025,472,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5342/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,025,664,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5343/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,025,856,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5344/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,026,048,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5345/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,026,240,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5346/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,026,432,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5347/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,026,624,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5348/500000]
+ train/ActionL1Loss=0.0378
+ throughput/total_tokens=1,026,816,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5349/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,027,008,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5350/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=1,027,200,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5351/500000]
+ train/ActionL1Loss=0.0386
+ throughput/total_tokens=1,027,392,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5352/500000]
+ train/ActionL1Loss=0.0398
+ throughput/total_tokens=1,027,584,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5353/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=1,027,776,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5354/500000]
+ train/ActionL1Loss=0.0331
+ throughput/total_tokens=1,027,968,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5355/500000]
+ train/ActionL1Loss=0.0363
+ throughput/total_tokens=1,028,160,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5356/500000]
+ train/ActionL1Loss=0.0361
+ throughput/total_tokens=1,028,352,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5357/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,028,544,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5358/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,028,736,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5359/500000]
+ train/ActionL1Loss=0.0356
+ throughput/total_tokens=1,028,928,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5360/500000]
+ optim/total_grad_norm=7.941
+ train/ActionL1Loss=0.0369
+ throughput/total_tokens=1,029,120,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=5361/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,029,312,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5362/500000]
+ train/ActionL1Loss=0.0332
+ throughput/total_tokens=1,029,504,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5363/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,029,696,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5364/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,029,888,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5365/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,030,080,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5366/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=1,030,272,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5367/500000]
+ train/ActionL1Loss=0.0362
+ throughput/total_tokens=1,030,464,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5368/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=1,030,656,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5369/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=1,030,848,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5370/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=1,031,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5371/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,031,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5372/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,031,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5373/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,031,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5374/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,031,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5375/500000]
+ train/ActionL1Loss=0.0370
+ throughput/total_tokens=1,032,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5376/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,032,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5377/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=1,032,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5378/500000]
+ train/ActionL1Loss=0.0410
+ throughput/total_tokens=1,032,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5379/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=1,032,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5380/500000]
+ optim/total_grad_norm=7.773
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=1,032,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5381/500000]
+ train/ActionL1Loss=0.0524
+ throughput/total_tokens=1,033,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5382/500000]
+ train/ActionL1Loss=0.0332
+ throughput/total_tokens=1,033,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5383/500000]
+ train/ActionL1Loss=0.0398
+ throughput/total_tokens=1,033,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5384/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,033,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5385/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,033,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5386/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,034,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5387/500000]
+ train/ActionL1Loss=0.0339
+ throughput/total_tokens=1,034,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5388/500000]
+ train/ActionL1Loss=0.0354
+ throughput/total_tokens=1,034,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5389/500000]
+ train/ActionL1Loss=0.0357
+ throughput/total_tokens=1,034,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5390/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=1,034,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5391/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,035,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5392/500000]
+ train/ActionL1Loss=0.0374
+ throughput/total_tokens=1,035,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5393/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,035,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5394/500000]
+ train/ActionL1Loss=0.0390
+ throughput/total_tokens=1,035,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5395/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,035,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5396/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=1,036,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5397/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,036,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5398/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=1,036,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5399/500000]
+ train/ActionL1Loss=0.0395
+ throughput/total_tokens=1,036,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5400/500000]
+ optim/total_grad_norm=8.136
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=1,036,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5401/500000]
+ train/ActionL1Loss=0.0355
+ throughput/total_tokens=1,036,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5402/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,037,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5403/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=1,037,376,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5404/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,037,568,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5405/500000]
+ train/ActionL1Loss=0.0387
+ throughput/total_tokens=1,037,760,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5406/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,037,952,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5407/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,038,144,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5408/500000]
+ train/ActionL1Loss=0.0362
+ throughput/total_tokens=1,038,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5409/500000]
+ train/ActionL1Loss=0.0357
+ throughput/total_tokens=1,038,528,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5410/500000]
+ train/ActionL1Loss=0.0429
+ throughput/total_tokens=1,038,720,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=5411/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=1,038,912,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5412/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,039,104,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5413/500000]
+ train/ActionL1Loss=0.0331
+ throughput/total_tokens=1,039,296,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5414/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,039,488,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5415/500000]
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=1,039,680,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5416/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=1,039,872,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5417/500000]
+ train/ActionL1Loss=0.0331
+ throughput/total_tokens=1,040,064,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5418/500000]
+ train/ActionL1Loss=0.0377
+ throughput/total_tokens=1,040,256,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5419/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,040,448,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5420/500000]
+ optim/total_grad_norm=7.963
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=1,040,640,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5421/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=1,040,832,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5422/500000]
+ train/ActionL1Loss=0.0370
+ throughput/total_tokens=1,041,024,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5423/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=1,041,216,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5424/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=1,041,408,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5425/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=1,041,600,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5426/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=1,041,792,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5427/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,041,984,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5428/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=1,042,176,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5429/500000]
+ train/ActionL1Loss=0.0368
+ throughput/total_tokens=1,042,368,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5430/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,042,560,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5431/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,042,752,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5432/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=1,042,944,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5433/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,043,136,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5434/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=1,043,328,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5435/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=1,043,520,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5436/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,043,712,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5437/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=1,043,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5438/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,044,096,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5439/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,044,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5440/500000]
+ optim/total_grad_norm=6.950
+ train/ActionL1Loss=0.0390
+ throughput/total_tokens=1,044,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5441/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,044,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5442/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=1,044,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5443/500000]
+ train/ActionL1Loss=0.0331
+ throughput/total_tokens=1,045,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5444/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,045,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5445/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=1,045,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5446/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,045,632,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5447/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=1,045,824,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5448/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=1,046,016,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5449/500000]
+ train/ActionL1Loss=0.0359
+ throughput/total_tokens=1,046,208,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5450/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,046,400,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5451/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=1,046,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5452/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,046,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5453/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,046,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5454/500000]
+ train/ActionL1Loss=0.0336
+ throughput/total_tokens=1,047,168,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5455/500000]
+ train/ActionL1Loss=0.0374
+ throughput/total_tokens=1,047,360,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5456/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,047,552,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5457/500000]
+ train/ActionL1Loss=0.0408
+ throughput/total_tokens=1,047,744,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5458/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=1,047,936,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5459/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,048,128,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5460/500000]
+ optim/total_grad_norm=9.471
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,048,320,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=5461/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=1,048,512,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5462/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,048,704,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5463/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=1,048,896,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5464/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,049,088,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5465/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=1,049,280,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5466/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,049,472,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5467/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,049,664,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5468/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=1,049,856,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5469/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=1,050,048,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5470/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=1,050,240,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5471/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=1,050,432,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5472/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,050,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5473/500000]
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=1,050,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5474/500000]
+ train/ActionL1Loss=0.0357
+ throughput/total_tokens=1,051,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5475/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=1,051,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5476/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=1,051,392,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5477/500000]
+ train/ActionL1Loss=0.0403
+ throughput/total_tokens=1,051,584,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5478/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,051,776,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5479/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=1,051,968,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5480/500000]
+ optim/total_grad_norm=9.128
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,052,160,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5481/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,052,352,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5482/500000]
+ train/ActionL1Loss=0.0365
+ throughput/total_tokens=1,052,544,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5483/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,052,736,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5484/500000]
+ train/ActionL1Loss=0.0398
+ throughput/total_tokens=1,052,928,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5485/500000]
+ train/ActionL1Loss=0.0401
+ throughput/total_tokens=1,053,120,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5486/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=1,053,312,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5487/500000]
+ train/ActionL1Loss=0.0484
+ throughput/total_tokens=1,053,504,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5488/500000]
+ train/ActionL1Loss=0.0370
+ throughput/total_tokens=1,053,696,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5489/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=1,053,888,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5490/500000]
+ train/ActionL1Loss=0.0371
+ throughput/total_tokens=1,054,080,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5491/500000]
+ train/ActionL1Loss=0.0388
+ throughput/total_tokens=1,054,272,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5492/500000]
+ train/ActionL1Loss=0.0392
+ throughput/total_tokens=1,054,464,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5493/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=1,054,656,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5494/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,054,848,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5495/500000]
+ train/ActionL1Loss=0.0368
+ throughput/total_tokens=1,055,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5496/500000]
+ train/ActionL1Loss=0.0432
+ throughput/total_tokens=1,055,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5497/500000]
+ train/ActionL1Loss=0.0381
+ throughput/total_tokens=1,055,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5498/500000]
+ train/ActionL1Loss=0.0396
+ throughput/total_tokens=1,055,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5499/500000]
+ train/ActionL1Loss=0.0491
+ throughput/total_tokens=1,055,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5500/500000]
+ optim/total_grad_norm=8.474
+ train/ActionL1Loss=0.0368
+ throughput/total_tokens=1,056,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+10/04 [00:24:49] INFO | >> Saving config... checkpoint.py:608
+10/04 [00:25:22] INFO | >> Saving model state... checkpoint.py:796
+10/04 [00:26:32] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [00:28:04] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=5501/500000]
+ train/ActionL1Loss=0.0325
+ throughput/total_tokens=1,056,192,000
+ throughput/device/tokens_per_second=1,210
+ throughput/device/batches_per_second=0.0504
+[step=5502/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,056,384,000
+ throughput/device/tokens_per_second=1,174
+ throughput/device/batches_per_second=0.0489
+[step=5503/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,056,576,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=5504/500000]
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=1,056,768,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=5505/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=1,056,960,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=5506/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,057,152,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5507/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=1,057,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5508/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=1,057,536,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=5509/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,057,728,000
+ throughput/device/tokens_per_second=1,160
+ throughput/device/batches_per_second=0.0484
+[step=5510/500000]
+ train/ActionL1Loss=0.0391
+ throughput/total_tokens=1,057,920,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+ System/Peak GPU Memory (MB)=46,917
+[step=5511/500000]
+ train/ActionL1Loss=0.0444
+ throughput/total_tokens=1,058,112,000
+ throughput/device/tokens_per_second=1,165
+ throughput/device/batches_per_second=0.0486
+[step=5512/500000]
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=1,058,304,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=5513/500000]
+ train/ActionL1Loss=0.0378
+ throughput/total_tokens=1,058,496,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=5514/500000]
+ train/ActionL1Loss=0.0386
+ throughput/total_tokens=1,058,688,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=5515/500000]
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=1,058,880,000
+ throughput/device/tokens_per_second=1,171
+ throughput/device/batches_per_second=0.0488
+[step=5516/500000]
+ train/ActionL1Loss=0.0390
+ throughput/total_tokens=1,059,072,000
+ throughput/device/tokens_per_second=1,171
+ throughput/device/batches_per_second=0.0488
+[step=5517/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,059,264,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+[step=5518/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=1,059,456,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=5519/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=1,059,648,000
+ throughput/device/tokens_per_second=1,174
+ throughput/device/batches_per_second=0.0489
+[step=5520/500000]
+ optim/total_grad_norm=7.844
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,059,840,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+ System/Peak GPU Memory (MB)=46,917
+[step=5521/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=1,060,032,000
+ throughput/device/tokens_per_second=1,174
+ throughput/device/batches_per_second=0.0489
+[step=5522/500000]
+ train/ActionL1Loss=0.0411
+ throughput/total_tokens=1,060,224,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=5523/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,060,416,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5524/500000]
+ train/ActionL1Loss=0.0356
+ throughput/total_tokens=1,060,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5525/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,060,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5526/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=1,060,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5527/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,061,184,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5528/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,061,376,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5529/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=1,061,568,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5530/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=1,061,760,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5531/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,061,952,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5532/500000]
+ train/ActionL1Loss=0.0394
+ throughput/total_tokens=1,062,144,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5533/500000]
+ train/ActionL1Loss=0.0331
+ throughput/total_tokens=1,062,336,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5534/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=1,062,528,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5535/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=1,062,720,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5536/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=1,062,912,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5537/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,063,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5538/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,063,296,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5539/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,063,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5540/500000]
+ optim/total_grad_norm=9.622
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,063,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5541/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,063,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5542/500000]
+ train/ActionL1Loss=0.0417
+ throughput/total_tokens=1,064,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5543/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,064,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5544/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,064,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5545/500000]
+ train/ActionL1Loss=0.0363
+ throughput/total_tokens=1,064,640,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5546/500000]
+ train/ActionL1Loss=0.0404
+ throughput/total_tokens=1,064,832,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5547/500000]
+ train/ActionL1Loss=0.0383
+ throughput/total_tokens=1,065,024,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5548/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,065,216,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5549/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,065,408,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5550/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=1,065,600,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5551/500000]
+ train/ActionL1Loss=0.0394
+ throughput/total_tokens=1,065,792,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5552/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=1,065,984,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5553/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,066,176,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5554/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=1,066,368,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5555/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=1,066,560,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5556/500000]
+ train/ActionL1Loss=0.0358
+ throughput/total_tokens=1,066,752,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5557/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,066,944,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5558/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=1,067,136,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5559/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,067,328,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5560/500000]
+ optim/total_grad_norm=7.660
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,067,520,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=5561/500000]
+ train/ActionL1Loss=0.0407
+ throughput/total_tokens=1,067,712,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5562/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=1,067,904,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5563/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=1,068,096,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5564/500000]
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=1,068,288,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5565/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,068,480,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5566/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=1,068,672,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5567/500000]
+ train/ActionL1Loss=0.0355
+ throughput/total_tokens=1,068,864,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5568/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,069,056,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5569/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,069,248,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5570/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,069,440,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5571/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,069,632,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5572/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=1,069,824,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5573/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=1,070,016,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5574/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,070,208,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5575/500000]
+ train/ActionL1Loss=0.0444
+ throughput/total_tokens=1,070,400,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5576/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,070,592,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5577/500000]
+ train/ActionL1Loss=0.0413
+ throughput/total_tokens=1,070,784,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5578/500000]
+ train/ActionL1Loss=0.0363
+ throughput/total_tokens=1,070,976,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5579/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=1,071,168,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5580/500000]
+ optim/total_grad_norm=8.332
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,071,360,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5581/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,071,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5582/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=1,071,744,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5583/500000]
+ train/ActionL1Loss=0.0357
+ throughput/total_tokens=1,071,936,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5584/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,072,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5585/500000]
+ train/ActionL1Loss=0.0354
+ throughput/total_tokens=1,072,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5586/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=1,072,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5587/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=1,072,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5588/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,072,896,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5589/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,073,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5590/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=1,073,280,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5591/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,073,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5592/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,073,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5593/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,073,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5594/500000]
+ train/ActionL1Loss=0.0387
+ throughput/total_tokens=1,074,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5595/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,074,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5596/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,074,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5597/500000]
+ train/ActionL1Loss=0.0357
+ throughput/total_tokens=1,074,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5598/500000]
+ train/ActionL1Loss=0.0401
+ throughput/total_tokens=1,074,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5599/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,075,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5600/500000]
+ optim/total_grad_norm=9.973
+ train/ActionL1Loss=0.0361
+ throughput/total_tokens=1,075,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5601/500000]
+ train/ActionL1Loss=0.0363
+ throughput/total_tokens=1,075,392,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5602/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=1,075,584,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5603/500000]
+ train/ActionL1Loss=0.0383
+ throughput/total_tokens=1,075,776,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5604/500000]
+ train/ActionL1Loss=0.0378
+ throughput/total_tokens=1,075,968,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5605/500000]
+ train/ActionL1Loss=0.0374
+ throughput/total_tokens=1,076,160,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5606/500000]
+ train/ActionL1Loss=0.0402
+ throughput/total_tokens=1,076,352,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5607/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,076,544,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5608/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=1,076,736,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5609/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=1,076,928,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5610/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=1,077,120,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=5611/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=1,077,312,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5612/500000]
+ train/ActionL1Loss=0.0392
+ throughput/total_tokens=1,077,504,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5613/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=1,077,696,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5614/500000]
+ train/ActionL1Loss=0.0323
+ throughput/total_tokens=1,077,888,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5615/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,078,080,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5616/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=1,078,272,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5617/500000]
+ train/ActionL1Loss=0.0369
+ throughput/total_tokens=1,078,464,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5618/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=1,078,656,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=5619/500000]
+ train/ActionL1Loss=0.0363
+ throughput/total_tokens=1,078,848,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5620/500000]
+ optim/total_grad_norm=7.751
+ train/ActionL1Loss=0.0361
+ throughput/total_tokens=1,079,040,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5621/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=1,079,232,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5622/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=1,079,424,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5623/500000]
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=1,079,616,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5624/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,079,808,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5625/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,080,000,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5626/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=1,080,192,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5627/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,080,384,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5628/500000]
+ train/ActionL1Loss=0.0388
+ throughput/total_tokens=1,080,576,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5629/500000]
+ train/ActionL1Loss=0.0325
+ throughput/total_tokens=1,080,768,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5630/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,080,960,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5631/500000]
+ train/ActionL1Loss=0.0387
+ throughput/total_tokens=1,081,152,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5632/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,081,344,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5633/500000]
+ train/ActionL1Loss=0.0325
+ throughput/total_tokens=1,081,536,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5634/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=1,081,728,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5635/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=1,081,920,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5636/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,082,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5637/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,082,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5638/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,082,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5639/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,082,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5640/500000]
+ optim/total_grad_norm=7.825
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,082,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5641/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,083,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5642/500000]
+ train/ActionL1Loss=0.0355
+ throughput/total_tokens=1,083,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5643/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,083,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5644/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,083,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5645/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,083,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5646/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=1,084,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5647/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,084,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5648/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,084,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5649/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=1,084,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5650/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,084,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5651/500000]
+ train/ActionL1Loss=0.0366
+ throughput/total_tokens=1,084,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5652/500000]
+ train/ActionL1Loss=0.0422
+ throughput/total_tokens=1,085,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5653/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,085,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5654/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,085,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5655/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=1,085,760,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5656/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,085,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5657/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,086,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5658/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,086,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5659/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=1,086,528,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5660/500000]
+ optim/total_grad_norm=5.916
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,086,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=5661/500000]
+ train/ActionL1Loss=0.0323
+ throughput/total_tokens=1,086,912,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5662/500000]
+ train/ActionL1Loss=0.0381
+ throughput/total_tokens=1,087,104,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5663/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=1,087,296,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5664/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,087,488,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5665/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=1,087,680,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5666/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=1,087,872,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5667/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,088,064,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5668/500000]
+ train/ActionL1Loss=0.0372
+ throughput/total_tokens=1,088,256,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5669/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,088,448,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5670/500000]
+ train/ActionL1Loss=0.0430
+ throughput/total_tokens=1,088,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5671/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,088,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5672/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,089,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5673/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,089,216,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5674/500000]
+ train/ActionL1Loss=0.0337
+ throughput/total_tokens=1,089,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5675/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=1,089,600,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5676/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=1,089,792,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5677/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,089,984,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5678/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=1,090,176,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5679/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,090,368,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5680/500000]
+ optim/total_grad_norm=9.399
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,090,560,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5681/500000]
+ train/ActionL1Loss=0.0332
+ throughput/total_tokens=1,090,752,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5682/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,090,944,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5683/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,091,136,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5684/500000]
+ train/ActionL1Loss=0.0336
+ throughput/total_tokens=1,091,328,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5685/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,091,520,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5686/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=1,091,712,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5687/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=1,091,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5688/500000]
+ train/ActionL1Loss=0.0339
+ throughput/total_tokens=1,092,096,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5689/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=1,092,288,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5690/500000]
+ train/ActionL1Loss=0.0339
+ throughput/total_tokens=1,092,480,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5691/500000]
+ train/ActionL1Loss=0.0374
+ throughput/total_tokens=1,092,672,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5692/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=1,092,864,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5693/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,093,056,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5694/500000]
+ train/ActionL1Loss=0.0428
+ throughput/total_tokens=1,093,248,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5695/500000]
+ train/ActionL1Loss=0.0331
+ throughput/total_tokens=1,093,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5696/500000]
+ train/ActionL1Loss=0.0323
+ throughput/total_tokens=1,093,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5697/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=1,093,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5698/500000]
+ train/ActionL1Loss=0.0331
+ throughput/total_tokens=1,094,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5699/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,094,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5700/500000]
+ optim/total_grad_norm=8.184
+ train/ActionL1Loss=0.0347
+ throughput/total_tokens=1,094,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5701/500000]
+ train/ActionL1Loss=0.0363
+ throughput/total_tokens=1,094,592,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5702/500000]
+ train/ActionL1Loss=0.0415
+ throughput/total_tokens=1,094,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5703/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=1,094,976,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5704/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=1,095,168,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5705/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,095,360,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5706/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,095,552,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5707/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,095,744,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5708/500000]
+ train/ActionL1Loss=0.0372
+ throughput/total_tokens=1,095,936,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5709/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=1,096,128,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5710/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,096,320,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=5711/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=1,096,512,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5712/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=1,096,704,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5713/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,096,896,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5714/500000]
+ train/ActionL1Loss=0.0430
+ throughput/total_tokens=1,097,088,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5715/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=1,097,280,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5716/500000]
+ train/ActionL1Loss=0.0361
+ throughput/total_tokens=1,097,472,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5717/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,097,664,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5718/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,097,856,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5719/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=1,098,048,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5720/500000]
+ optim/total_grad_norm=8.358
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,098,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5721/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=1,098,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5722/500000]
+ train/ActionL1Loss=0.0359
+ throughput/total_tokens=1,098,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5723/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,098,816,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5724/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,099,008,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5725/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,099,200,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5726/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=1,099,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5727/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=1,099,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5728/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,099,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5729/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,099,968,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5730/500000]
+ train/ActionL1Loss=0.0354
+ throughput/total_tokens=1,100,160,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5731/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=1,100,352,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5732/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,100,544,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5733/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,100,736,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5734/500000]
+ train/ActionL1Loss=0.0337
+ throughput/total_tokens=1,100,928,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5735/500000]
+ train/ActionL1Loss=0.0388
+ throughput/total_tokens=1,101,120,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5736/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=1,101,312,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5737/500000]
+ train/ActionL1Loss=0.0339
+ throughput/total_tokens=1,101,504,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5738/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=1,101,696,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5739/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=1,101,888,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5740/500000]
+ optim/total_grad_norm=7.727
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,102,080,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5741/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,102,272,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5742/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=1,102,464,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5743/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,102,656,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5744/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,102,848,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5745/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=1,103,040,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5746/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,103,232,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5747/500000]
+ train/ActionL1Loss=0.0423
+ throughput/total_tokens=1,103,424,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5748/500000]
+ train/ActionL1Loss=0.0421
+ throughput/total_tokens=1,103,616,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5749/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,103,808,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5750/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,104,000,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5751/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,104,192,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5752/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=1,104,384,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5753/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=1,104,576,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5754/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,104,768,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5755/500000]
+ train/ActionL1Loss=0.0354
+ throughput/total_tokens=1,104,960,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5756/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=1,105,152,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5757/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,105,344,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5758/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,105,536,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5759/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,105,728,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5760/500000]
+ optim/total_grad_norm=7.870
+ train/ActionL1Loss=0.0323
+ throughput/total_tokens=1,105,920,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=5761/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,106,112,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5762/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=1,106,304,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5763/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,106,496,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5764/500000]
+ train/ActionL1Loss=0.0337
+ throughput/total_tokens=1,106,688,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5765/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,106,880,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5766/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,107,072,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5767/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,107,264,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5768/500000]
+ train/ActionL1Loss=0.0323
+ throughput/total_tokens=1,107,456,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5769/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,107,648,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5770/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=1,107,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5771/500000]
+ train/ActionL1Loss=0.0366
+ throughput/total_tokens=1,108,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5772/500000]
+ train/ActionL1Loss=0.0371
+ throughput/total_tokens=1,108,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5773/500000]
+ train/ActionL1Loss=0.0372
+ throughput/total_tokens=1,108,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5774/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,108,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5775/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,108,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5776/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,108,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5777/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,109,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5778/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,109,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5779/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,109,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5780/500000]
+ optim/total_grad_norm=7.329
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,109,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5781/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=1,109,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5782/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,110,144,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5783/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,110,336,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5784/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,110,528,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5785/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,110,720,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5786/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,110,912,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5787/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=1,111,104,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5788/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,111,296,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5789/500000]
+ train/ActionL1Loss=0.0420
+ throughput/total_tokens=1,111,488,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5790/500000]
+ train/ActionL1Loss=0.0369
+ throughput/total_tokens=1,111,680,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5791/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=1,111,872,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5792/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=1,112,064,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5793/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,112,256,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5794/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,112,448,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5795/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=1,112,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5796/500000]
+ train/ActionL1Loss=0.0369
+ throughput/total_tokens=1,112,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5797/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,113,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5798/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,113,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5799/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,113,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5800/500000]
+ optim/total_grad_norm=7.586
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,113,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5801/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=1,113,792,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5802/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=1,113,984,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5803/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=1,114,176,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5804/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,114,368,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5805/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,114,560,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5806/500000]
+ train/ActionL1Loss=0.0325
+ throughput/total_tokens=1,114,752,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5807/500000]
+ train/ActionL1Loss=0.0358
+ throughput/total_tokens=1,114,944,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5808/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,115,136,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5809/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=1,115,328,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5810/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,115,520,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=5811/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,115,712,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=5812/500000]
+ train/ActionL1Loss=0.0392
+ throughput/total_tokens=1,115,904,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=5813/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,116,096,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=5814/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,116,288,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=5815/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,116,480,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=5816/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,116,672,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=5817/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,116,864,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=5818/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,117,056,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=5819/500000]
+ train/ActionL1Loss=0.0363
+ throughput/total_tokens=1,117,248,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=5820/500000]
+ optim/total_grad_norm=8.184
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=1,117,440,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=5821/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=1,117,632,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5822/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=1,117,824,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5823/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,118,016,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5824/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=1,118,208,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5825/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,118,400,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5826/500000]
+ train/ActionL1Loss=0.0374
+ throughput/total_tokens=1,118,592,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5827/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,118,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5828/500000]
+ train/ActionL1Loss=0.0424
+ throughput/total_tokens=1,118,976,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5829/500000]
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=1,119,168,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5830/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,119,360,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=5831/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,119,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5832/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=1,119,744,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5833/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=1,119,936,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5834/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,120,128,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5835/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,120,320,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5836/500000]
+ train/ActionL1Loss=0.0370
+ throughput/total_tokens=1,120,512,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5837/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,120,704,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5838/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,120,896,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5839/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,121,088,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5840/500000]
+ optim/total_grad_norm=9.596
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=1,121,280,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5841/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,121,472,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5842/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,121,664,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5843/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,121,856,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5844/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,122,048,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5845/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,122,240,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5846/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=1,122,432,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5847/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,122,624,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5848/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,122,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5849/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=1,123,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5850/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,123,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5851/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,123,392,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5852/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,123,584,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5853/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,123,776,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5854/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,123,968,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5855/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,124,160,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5856/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,124,352,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5857/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,124,544,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5858/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,124,736,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5859/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,124,928,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5860/500000]
+ optim/total_grad_norm=8.537
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=1,125,120,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=5861/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,125,312,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5862/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,125,504,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5863/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=1,125,696,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5864/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,125,888,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5865/500000]
+ train/ActionL1Loss=0.0325
+ throughput/total_tokens=1,126,080,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5866/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,126,272,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5867/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,126,464,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5868/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,126,656,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5869/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,126,848,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5870/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=1,127,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5871/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,127,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5872/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,127,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5873/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=1,127,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5874/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=1,127,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5875/500000]
+ train/ActionL1Loss=0.0347
+ throughput/total_tokens=1,128,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5876/500000]
+ train/ActionL1Loss=0.0355
+ throughput/total_tokens=1,128,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5877/500000]
+ train/ActionL1Loss=0.0366
+ throughput/total_tokens=1,128,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5878/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,128,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5879/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,128,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5880/500000]
+ optim/total_grad_norm=7.471
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=1,128,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5881/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,129,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5882/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,129,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5883/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,129,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5884/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,129,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5885/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,129,920,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5886/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,130,112,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5887/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,130,304,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5888/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,130,496,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5889/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,130,688,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5890/500000]
+ train/ActionL1Loss=0.0416
+ throughput/total_tokens=1,130,880,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5891/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,131,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5892/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,131,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5893/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=1,131,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5894/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=1,131,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5895/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=1,131,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5896/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,132,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5897/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,132,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5898/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,132,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5899/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=1,132,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5900/500000]
+ optim/total_grad_norm=9.003
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=1,132,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5901/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,132,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5902/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,133,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5903/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,133,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5904/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,133,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5905/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=1,133,760,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5906/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,133,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5907/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=1,134,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5908/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=1,134,336,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5909/500000]
+ train/ActionL1Loss=0.0366
+ throughput/total_tokens=1,134,528,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5910/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=1,134,720,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5911/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,134,912,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5912/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,135,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5913/500000]
+ train/ActionL1Loss=0.0354
+ throughput/total_tokens=1,135,296,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5914/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=1,135,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5915/500000]
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=1,135,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5916/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,135,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5917/500000]
+ train/ActionL1Loss=0.0325
+ throughput/total_tokens=1,136,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5918/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,136,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5919/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,136,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5920/500000]
+ optim/total_grad_norm=7.721
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,136,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5921/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,136,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5922/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,137,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5923/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,137,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5924/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,137,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5925/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,137,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5926/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,137,792,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5927/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,137,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5928/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,138,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5929/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,138,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5930/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,138,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5931/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,138,752,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=5932/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,138,944,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5933/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,139,136,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5934/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,139,328,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5935/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=1,139,520,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5936/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,139,712,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5937/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,139,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5938/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=1,140,096,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5939/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=1,140,288,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5940/500000]
+ optim/total_grad_norm=8.963
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,140,480,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5941/500000]
+ train/ActionL1Loss=0.0363
+ throughput/total_tokens=1,140,672,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5942/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,140,864,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=5943/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,141,056,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5944/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,141,248,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5945/500000]
+ train/ActionL1Loss=0.0339
+ throughput/total_tokens=1,141,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5946/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,141,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5947/500000]
+ train/ActionL1Loss=0.0396
+ throughput/total_tokens=1,141,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5948/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,142,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5949/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=1,142,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=5950/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,142,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=5951/500000]
+ train/ActionL1Loss=0.0365
+ throughput/total_tokens=1,142,592,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5952/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=1,142,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5953/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=1,142,976,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5954/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=1,143,168,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5955/500000]
+ train/ActionL1Loss=0.0461
+ throughput/total_tokens=1,143,360,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=5956/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,143,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5957/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,143,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5958/500000]
+ train/ActionL1Loss=0.0361
+ throughput/total_tokens=1,143,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5959/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,144,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5960/500000]
+ optim/total_grad_norm=9.601
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,144,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=5961/500000]
+ train/ActionL1Loss=0.0366
+ throughput/total_tokens=1,144,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5962/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,144,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5963/500000]
+ train/ActionL1Loss=0.0380
+ throughput/total_tokens=1,144,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5964/500000]
+ train/ActionL1Loss=0.0386
+ throughput/total_tokens=1,145,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5965/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,145,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5966/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,145,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5967/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,145,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=5968/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,145,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5969/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,146,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=5970/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,146,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5971/500000]
+ train/ActionL1Loss=0.0347
+ throughput/total_tokens=1,146,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5972/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=1,146,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5973/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,146,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5974/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,147,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5975/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,147,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5976/500000]
+ train/ActionL1Loss=0.0446
+ throughput/total_tokens=1,147,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5977/500000]
+ train/ActionL1Loss=0.0354
+ throughput/total_tokens=1,147,584,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5978/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=1,147,776,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5979/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,147,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5980/500000]
+ optim/total_grad_norm=8.355
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=1,148,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5981/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,148,352,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5982/500000]
+ train/ActionL1Loss=0.0332
+ throughput/total_tokens=1,148,544,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5983/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=1,148,736,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5984/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,148,928,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5985/500000]
+ train/ActionL1Loss=0.0434
+ throughput/total_tokens=1,149,120,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5986/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=1,149,312,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=5987/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=1,149,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5988/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,149,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5989/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,149,888,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5990/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=1,150,080,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=5991/500000]
+ train/ActionL1Loss=0.0395
+ throughput/total_tokens=1,150,272,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5992/500000]
+ train/ActionL1Loss=0.0358
+ throughput/total_tokens=1,150,464,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5993/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,150,656,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5994/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,150,848,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5995/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=1,151,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5996/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,151,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5997/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,151,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5998/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,151,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=5999/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,151,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6000/500000]
+ optim/total_grad_norm=9.641
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,152,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+10/04 [03:18:14] INFO | >> Saving config... checkpoint.py:608
+10/04 [03:19:08] INFO | >> Saving model state... checkpoint.py:796
+10/04 [03:20:20] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [03:21:52] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=6001/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,152,192,000
+ throughput/device/tokens_per_second=1,219
+ throughput/device/batches_per_second=0.0508
+[step=6002/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=1,152,384,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6003/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,152,576,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=6004/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,152,768,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6005/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,152,960,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6006/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,153,152,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6007/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,153,344,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6008/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,153,536,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6009/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,153,728,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6010/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,153,920,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6011/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,154,112,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6012/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,154,304,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6013/500000]
+ train/ActionL1Loss=0.0363
+ throughput/total_tokens=1,154,496,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6014/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=1,154,688,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6015/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,154,880,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6016/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=1,155,072,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6017/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,155,264,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6018/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=1,155,456,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6019/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,155,648,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6020/500000]
+ optim/total_grad_norm=7.029
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,155,840,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6021/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,156,032,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6022/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=1,156,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6023/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,156,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6024/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,156,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6025/500000]
+ train/ActionL1Loss=0.0371
+ throughput/total_tokens=1,156,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6026/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,156,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6027/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,157,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6028/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,157,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6029/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,157,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6030/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=1,157,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6031/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,157,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6032/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,158,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6033/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,158,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6034/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,158,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6035/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,158,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6036/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=1,158,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6037/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,159,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6038/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,159,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6039/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,159,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6040/500000]
+ optim/total_grad_norm=8.426
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,159,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6041/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,159,872,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6042/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,160,064,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6043/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,160,256,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6044/500000]
+ train/ActionL1Loss=0.0387
+ throughput/total_tokens=1,160,448,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6045/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,160,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6046/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,160,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6047/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=1,161,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6048/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,161,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6049/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,161,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6050/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,161,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6051/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,161,792,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6052/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,161,984,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6053/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,162,176,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6054/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,162,368,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6055/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=1,162,560,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6056/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,162,752,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6057/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,162,944,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6058/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,163,136,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6059/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,163,328,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6060/500000]
+ optim/total_grad_norm=9.157
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,163,520,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=6061/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,163,712,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6062/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,163,904,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6063/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=1,164,096,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6064/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=1,164,288,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6065/500000]
+ train/ActionL1Loss=0.0357
+ throughput/total_tokens=1,164,480,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6066/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=1,164,672,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6067/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,164,864,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6068/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=1,165,056,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6069/500000]
+ train/ActionL1Loss=0.0377
+ throughput/total_tokens=1,165,248,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6070/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,165,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6071/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,165,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6072/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,165,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6073/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,166,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6074/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,166,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6075/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,166,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6076/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,166,592,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6077/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,166,784,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6078/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,166,976,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6079/500000]
+ train/ActionL1Loss=0.0331
+ throughput/total_tokens=1,167,168,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6080/500000]
+ optim/total_grad_norm=6.895
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,167,360,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6081/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,167,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6082/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,167,744,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6083/500000]
+ train/ActionL1Loss=0.0347
+ throughput/total_tokens=1,167,936,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6084/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=1,168,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6085/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=1,168,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6086/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=1,168,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6087/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=1,168,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6088/500000]
+ train/ActionL1Loss=0.0398
+ throughput/total_tokens=1,168,896,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6089/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,169,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6090/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,169,280,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6091/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,169,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6092/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,169,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6093/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,169,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6094/500000]
+ train/ActionL1Loss=0.0372
+ throughput/total_tokens=1,170,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6095/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,170,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6096/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=1,170,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6097/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=1,170,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6098/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=1,170,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6099/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,171,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6100/500000]
+ optim/total_grad_norm=10.10
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,171,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6101/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=1,171,392,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6102/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,171,584,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6103/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,171,776,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6104/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,171,968,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6105/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,172,160,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6106/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,172,352,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6107/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,172,544,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6108/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=1,172,736,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6109/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,172,928,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6110/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,173,120,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=6111/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,173,312,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6112/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=1,173,504,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=6113/500000]
+ train/ActionL1Loss=0.0362
+ throughput/total_tokens=1,173,696,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=6114/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=1,173,888,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6115/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,174,080,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6116/500000]
+ train/ActionL1Loss=0.0340
+ throughput/total_tokens=1,174,272,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6117/500000]
+ train/ActionL1Loss=0.0363
+ throughput/total_tokens=1,174,464,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6118/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,174,656,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6119/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,174,848,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6120/500000]
+ optim/total_grad_norm=5.861
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,175,040,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6121/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,175,232,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6122/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,175,424,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6123/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,175,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6124/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,175,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6125/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,176,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6126/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,176,192,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6127/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,176,384,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6128/500000]
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=1,176,576,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6129/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,176,768,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6130/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,176,960,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6131/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,177,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6132/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=1,177,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6133/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=1,177,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6134/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,177,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6135/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=1,177,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6136/500000]
+ train/ActionL1Loss=0.0339
+ throughput/total_tokens=1,178,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6137/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,178,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6138/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=1,178,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6139/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=1,178,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6140/500000]
+ optim/total_grad_norm=8.723
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,178,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6141/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,179,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6142/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,179,264,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6143/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=1,179,456,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6144/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=1,179,648,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6145/500000]
+ train/ActionL1Loss=0.0392
+ throughput/total_tokens=1,179,840,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6146/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,180,032,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6147/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,180,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6148/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,180,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6149/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=1,180,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6150/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,180,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6151/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,180,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6152/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,181,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6153/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,181,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6154/500000]
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=1,181,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6155/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,181,760,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6156/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,181,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6157/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,182,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6158/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=1,182,336,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6159/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,182,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6160/500000]
+ optim/total_grad_norm=7.813
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,182,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6161/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=1,182,912,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6162/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=1,183,104,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6163/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=1,183,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6164/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=1,183,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6165/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=1,183,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6166/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,183,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6167/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,184,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6168/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,184,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6169/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,184,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6170/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,184,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6171/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,184,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6172/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,185,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6173/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,185,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6174/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=1,185,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6175/500000]
+ train/ActionL1Loss=0.0372
+ throughput/total_tokens=1,185,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6176/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,185,792,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6177/500000]
+ train/ActionL1Loss=0.0347
+ throughput/total_tokens=1,185,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6178/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=1,186,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6179/500000]
+ train/ActionL1Loss=0.0372
+ throughput/total_tokens=1,186,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6180/500000]
+ optim/total_grad_norm=9.126
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,186,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6181/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,186,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6182/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,186,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6183/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=1,187,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6184/500000]
+ train/ActionL1Loss=0.0437
+ throughput/total_tokens=1,187,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6185/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=1,187,520,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6186/500000]
+ train/ActionL1Loss=0.0337
+ throughput/total_tokens=1,187,712,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6187/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=1,187,904,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6188/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=1,188,096,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6189/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,188,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6190/500000]
+ train/ActionL1Loss=0.0361
+ throughput/total_tokens=1,188,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6191/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,188,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6192/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,188,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6193/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,189,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6194/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,189,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6195/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,189,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6196/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,189,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6197/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,189,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6198/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,190,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6199/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=1,190,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6200/500000]
+ optim/total_grad_norm=11.68
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=1,190,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6201/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=1,190,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6202/500000]
+ train/ActionL1Loss=0.0357
+ throughput/total_tokens=1,190,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6203/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,190,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6204/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,191,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6205/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=1,191,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6206/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,191,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6207/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=1,191,744,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6208/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,191,936,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6209/500000]
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=1,192,128,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6210/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,192,320,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=6211/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,192,512,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6212/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,192,704,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6213/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=1,192,896,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6214/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,193,088,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6215/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,193,280,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6216/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,193,472,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6217/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,193,664,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6218/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,193,856,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6219/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,194,048,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6220/500000]
+ optim/total_grad_norm=7.065
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,194,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6221/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,194,432,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6222/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,194,624,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6223/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,194,816,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6224/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,195,008,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6225/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,195,200,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6226/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,195,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6227/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,195,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6228/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,195,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6229/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,195,968,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6230/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,196,160,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6231/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,196,352,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6232/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,196,544,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6233/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,196,736,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6234/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,196,928,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6235/500000]
+ train/ActionL1Loss=0.0332
+ throughput/total_tokens=1,197,120,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6236/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,197,312,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6237/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,197,504,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6238/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,197,696,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6239/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=1,197,888,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6240/500000]
+ optim/total_grad_norm=9.567
+ train/ActionL1Loss=0.0355
+ throughput/total_tokens=1,198,080,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6241/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,198,272,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6242/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,198,464,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6243/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=1,198,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6244/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,198,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6245/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,199,040,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6246/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,199,232,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6247/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,199,424,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6248/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,199,616,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6249/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=1,199,808,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6250/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,200,000,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6251/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,200,192,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6252/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,200,384,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6253/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,200,576,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6254/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,200,768,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6255/500000]
+ train/ActionL1Loss=0.0359
+ throughput/total_tokens=1,200,960,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6256/500000]
+ train/ActionL1Loss=0.0376
+ throughput/total_tokens=1,201,152,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6257/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,201,344,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6258/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,201,536,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6259/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=1,201,728,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6260/500000]
+ optim/total_grad_norm=7.840
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,201,920,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=6261/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,202,112,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6262/500000]
+ train/ActionL1Loss=0.0339
+ throughput/total_tokens=1,202,304,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6263/500000]
+ train/ActionL1Loss=0.0331
+ throughput/total_tokens=1,202,496,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6264/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,202,688,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6265/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,202,880,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6266/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,203,072,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6267/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,203,264,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6268/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,203,456,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6269/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,203,648,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6270/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,203,840,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6271/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,204,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6272/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,204,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6273/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,204,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6274/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,204,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6275/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,204,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6276/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,204,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6277/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,205,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6278/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=1,205,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6279/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,205,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6280/500000]
+ optim/total_grad_norm=6.575
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,205,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6281/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,205,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6282/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,206,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6283/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,206,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6284/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,206,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6285/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,206,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6286/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,206,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6287/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,207,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6288/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=1,207,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6289/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,207,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6290/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,207,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6291/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,207,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6292/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,208,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6293/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,208,256,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6294/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,208,448,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6295/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,208,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6296/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,208,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6297/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,209,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6298/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,209,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6299/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=1,209,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6300/500000]
+ optim/total_grad_norm=8.317
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=1,209,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6301/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=1,209,792,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6302/500000]
+ train/ActionL1Loss=0.0430
+ throughput/total_tokens=1,209,984,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6303/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,210,176,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6304/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,210,368,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6305/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,210,560,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6306/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=1,210,752,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6307/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,210,944,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6308/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,211,136,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6309/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,211,328,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6310/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=1,211,520,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=6311/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,211,712,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6312/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,211,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6313/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,212,096,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6314/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,212,288,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6315/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,212,480,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6316/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,212,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6317/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,212,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6318/500000]
+ train/ActionL1Loss=0.0370
+ throughput/total_tokens=1,213,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6319/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=1,213,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6320/500000]
+ optim/total_grad_norm=7.997
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,213,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6321/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,213,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6322/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,213,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6323/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,214,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6324/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,214,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6325/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,214,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6326/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,214,592,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6327/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,214,784,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6328/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=1,214,976,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6329/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,215,168,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6330/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,215,360,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6331/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,215,552,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6332/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,215,744,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6333/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,215,936,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6334/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,216,128,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6335/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,216,320,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6336/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,216,512,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6337/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,216,704,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6338/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,216,896,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6339/500000]
+ train/ActionL1Loss=0.0395
+ throughput/total_tokens=1,217,088,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6340/500000]
+ optim/total_grad_norm=8.337
+ train/ActionL1Loss=0.0409
+ throughput/total_tokens=1,217,280,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6341/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=1,217,472,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6342/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,217,664,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6343/500000]
+ train/ActionL1Loss=0.0402
+ throughput/total_tokens=1,217,856,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6344/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,218,048,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6345/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,218,240,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6346/500000]
+ train/ActionL1Loss=0.0361
+ throughput/total_tokens=1,218,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6347/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=1,218,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6348/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,218,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6349/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,219,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6350/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,219,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6351/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,219,392,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6352/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=1,219,584,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6353/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,219,776,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6354/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,219,968,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6355/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,220,160,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6356/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,220,352,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6357/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,220,544,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6358/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=1,220,736,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6359/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,220,928,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6360/500000]
+ optim/total_grad_norm=7.077
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,221,120,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=6361/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,221,312,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6362/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=1,221,504,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6363/500000]
+ train/ActionL1Loss=0.0362
+ throughput/total_tokens=1,221,696,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6364/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,221,888,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6365/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,222,080,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6366/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,222,272,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6367/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,222,464,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6368/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,222,656,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6369/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,222,848,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6370/500000]
+ train/ActionL1Loss=0.0394
+ throughput/total_tokens=1,223,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6371/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,223,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6372/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,223,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6373/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,223,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6374/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,223,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6375/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,224,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6376/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,224,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6377/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,224,384,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6378/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,224,576,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6379/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,224,768,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6380/500000]
+ optim/total_grad_norm=7.318
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,224,960,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6381/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,225,152,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6382/500000]
+ train/ActionL1Loss=0.0376
+ throughput/total_tokens=1,225,344,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6383/500000]
+ train/ActionL1Loss=0.0357
+ throughput/total_tokens=1,225,536,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6384/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,225,728,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6385/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,225,920,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6386/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,226,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6387/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,226,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6388/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,226,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6389/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=1,226,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6390/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=1,226,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6391/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,227,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6392/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,227,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6393/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,227,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6394/500000]
+ train/ActionL1Loss=0.0325
+ throughput/total_tokens=1,227,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6395/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,227,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6396/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,228,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6397/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,228,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6398/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,228,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6399/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,228,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6400/500000]
+ optim/total_grad_norm=7.338
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,228,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6401/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,228,992,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6402/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,229,184,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6403/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,229,376,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6404/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=1,229,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6405/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,229,760,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6406/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,229,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6407/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,230,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6408/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,230,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6409/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,230,528,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6410/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,230,720,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=6411/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,230,912,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6412/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,231,104,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6413/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,231,296,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6414/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,231,488,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6415/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,231,680,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6416/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,231,872,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6417/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,232,064,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6418/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,232,256,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6419/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,232,448,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6420/500000]
+ optim/total_grad_norm=8.177
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,232,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6421/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,232,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6422/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,233,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6423/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,233,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6424/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,233,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6425/500000]
+ train/ActionL1Loss=0.0337
+ throughput/total_tokens=1,233,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6426/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,233,792,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6427/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,233,984,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6428/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,234,176,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6429/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,234,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6430/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,234,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6431/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,234,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6432/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=1,234,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6433/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,235,136,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6434/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,235,328,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6435/500000]
+ train/ActionL1Loss=0.0424
+ throughput/total_tokens=1,235,520,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6436/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=1,235,712,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6437/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,235,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6438/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,236,096,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6439/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,236,288,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6440/500000]
+ optim/total_grad_norm=7.705
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,236,480,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6441/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=1,236,672,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6442/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=1,236,864,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6443/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,237,056,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6444/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,237,248,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6445/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,237,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6446/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,237,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6447/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,237,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6448/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,238,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6449/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,238,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6450/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,238,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6451/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,238,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6452/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,238,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6453/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,238,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6454/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,239,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6455/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,239,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6456/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,239,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6457/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,239,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6458/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,239,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6459/500000]
+ train/ActionL1Loss=0.0336
+ throughput/total_tokens=1,240,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6460/500000]
+ optim/total_grad_norm=7.636
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=1,240,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6461/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,240,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6462/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,240,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6463/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,240,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6464/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=1,241,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6465/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,241,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6466/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,241,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6467/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,241,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6468/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,241,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6469/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,242,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6470/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,242,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6471/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,242,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6472/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,242,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6473/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,242,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6474/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,243,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6475/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,243,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6476/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,243,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6477/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,243,584,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6478/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,243,776,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6479/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,243,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6480/500000]
+ optim/total_grad_norm=6.270
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,244,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6481/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,244,352,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6482/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,244,544,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6483/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=1,244,736,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6484/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,244,928,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6485/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,245,120,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6486/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,245,312,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6487/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,245,504,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6488/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,245,696,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6489/500000]
+ train/ActionL1Loss=0.0378
+ throughput/total_tokens=1,245,888,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6490/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,246,080,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6491/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,246,272,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6492/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,246,464,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6493/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,246,656,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6494/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=1,246,848,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6495/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,247,040,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6496/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,247,232,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6497/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,247,424,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6498/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,247,616,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6499/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,247,808,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6500/500000]
+ optim/total_grad_norm=6.788
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,248,000,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+10/04 [06:12:11] INFO | >> Saving config... checkpoint.py:608
+10/04 [06:12:47] INFO | >> Saving model state... checkpoint.py:796
+10/04 [06:13:58] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [06:15:29] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=6501/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,248,192,000
+ throughput/device/tokens_per_second=1,217
+ throughput/device/batches_per_second=0.0507
+[step=6502/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,248,384,000
+ throughput/device/tokens_per_second=1,198
+ throughput/device/batches_per_second=0.0500
+[step=6503/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,248,576,000
+ throughput/device/tokens_per_second=1,194
+ throughput/device/batches_per_second=0.0498
+[step=6504/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,248,768,000
+ throughput/device/tokens_per_second=1,192
+ throughput/device/batches_per_second=0.0497
+[step=6505/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,248,960,000
+ throughput/device/tokens_per_second=1,191
+ throughput/device/batches_per_second=0.0497
+[step=6506/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,249,152,000
+ throughput/device/tokens_per_second=1,190
+ throughput/device/batches_per_second=0.0496
+[step=6507/500000]
+ train/ActionL1Loss=0.0325
+ throughput/total_tokens=1,249,344,000
+ throughput/device/tokens_per_second=1,190
+ throughput/device/batches_per_second=0.0496
+[step=6508/500000]
+ train/ActionL1Loss=0.0336
+ throughput/total_tokens=1,249,536,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=6509/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,249,728,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6510/500000]
+ train/ActionL1Loss=0.0336
+ throughput/total_tokens=1,249,920,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6511/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,250,112,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6512/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=1,250,304,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6513/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,250,496,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6514/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=1,250,688,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6515/500000]
+ train/ActionL1Loss=0.0336
+ throughput/total_tokens=1,250,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6516/500000]
+ train/ActionL1Loss=0.0447
+ throughput/total_tokens=1,251,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6517/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,251,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6518/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,251,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6519/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,251,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6520/500000]
+ optim/total_grad_norm=8.982
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,251,840,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6521/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,252,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6522/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,252,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6523/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,252,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6524/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,252,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6525/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,252,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6526/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,252,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6527/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,253,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6528/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,253,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6529/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,253,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6530/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,253,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6531/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,253,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6532/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,254,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6533/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,254,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6534/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,254,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6535/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,254,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6536/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,254,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6537/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,255,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6538/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,255,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6539/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,255,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6540/500000]
+ optim/total_grad_norm=9.432
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,255,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6541/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,255,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6542/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,256,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6543/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,256,256,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6544/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,256,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6545/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=1,256,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6546/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,256,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6547/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,257,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6548/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,257,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6549/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,257,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6550/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,257,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6551/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,257,792,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6552/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,257,984,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6553/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=1,258,176,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6554/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,258,368,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6555/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,258,560,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6556/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,258,752,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6557/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,258,944,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6558/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,259,136,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6559/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=1,259,328,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6560/500000]
+ optim/total_grad_norm=7.098
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,259,520,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=6561/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,259,712,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6562/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,259,904,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6563/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,260,096,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6564/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,260,288,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6565/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,260,480,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6566/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,260,672,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6567/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,260,864,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6568/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,261,056,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6569/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,261,248,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6570/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,261,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6571/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,261,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6572/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,261,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6573/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,262,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6574/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,262,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6575/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,262,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6576/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,262,592,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6577/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,262,784,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6578/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,262,976,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6579/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,263,168,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6580/500000]
+ optim/total_grad_norm=8.225
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,263,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6581/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,263,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6582/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,263,744,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6583/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,263,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6584/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,264,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6585/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,264,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6586/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,264,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6587/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,264,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6588/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,264,896,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6589/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,265,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6590/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,265,280,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6591/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,265,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6592/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,265,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6593/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,265,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6594/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,266,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6595/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,266,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6596/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,266,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6597/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,266,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6598/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,266,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6599/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,267,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6600/500000]
+ optim/total_grad_norm=7.892
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,267,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6601/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,267,392,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6602/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,267,584,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6603/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,267,776,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6604/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,267,968,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6605/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,268,160,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6606/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,268,352,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6607/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,268,544,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6608/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,268,736,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6609/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,268,928,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6610/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,269,120,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6611/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,269,312,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6612/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,269,504,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6613/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,269,696,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6614/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,269,888,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6615/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,270,080,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6616/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,270,272,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6617/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,270,464,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6618/500000]
+ train/ActionL1Loss=0.0340
+ throughput/total_tokens=1,270,656,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6619/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,270,848,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6620/500000]
+ optim/total_grad_norm=8.567
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,271,040,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6621/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,271,232,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6622/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,271,424,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6623/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,271,616,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6624/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,271,808,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6625/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,272,000,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6626/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,272,192,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6627/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=1,272,384,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6628/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=1,272,576,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6629/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,272,768,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6630/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,272,960,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=6631/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,273,152,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6632/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,273,344,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6633/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,273,536,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6634/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,273,728,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6635/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,273,920,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6636/500000]
+ train/ActionL1Loss=0.0381
+ throughput/total_tokens=1,274,112,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6637/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,274,304,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6638/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,274,496,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6639/500000]
+ train/ActionL1Loss=0.0331
+ throughput/total_tokens=1,274,688,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6640/500000]
+ optim/total_grad_norm=8.991
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,274,880,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6641/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=1,275,072,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6642/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,275,264,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6643/500000]
+ train/ActionL1Loss=0.0371
+ throughput/total_tokens=1,275,456,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6644/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,275,648,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6645/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=1,275,840,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6646/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,276,032,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6647/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,276,224,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6648/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,276,416,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6649/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,276,608,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6650/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,276,800,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6651/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=1,276,992,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6652/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=1,277,184,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6653/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=1,277,376,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6654/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,277,568,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6655/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,277,760,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6656/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,277,952,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6657/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,278,144,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6658/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,278,336,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6659/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=1,278,528,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6660/500000]
+ optim/total_grad_norm=7.755
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,278,720,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=6661/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,278,912,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6662/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,279,104,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6663/500000]
+ train/ActionL1Loss=0.0349
+ throughput/total_tokens=1,279,296,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6664/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,279,488,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6665/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,279,680,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6666/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,279,872,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6667/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=1,280,064,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6668/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,280,256,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6669/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,280,448,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6670/500000]
+ train/ActionL1Loss=0.0323
+ throughput/total_tokens=1,280,640,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6671/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,280,832,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6672/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,281,024,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6673/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=1,281,216,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6674/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,281,408,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6675/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,281,600,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6676/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,281,792,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6677/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,281,984,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6678/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=1,282,176,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6679/500000]
+ train/ActionL1Loss=0.0370
+ throughput/total_tokens=1,282,368,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6680/500000]
+ optim/total_grad_norm=6.613
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,282,560,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6681/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,282,752,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6682/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,282,944,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6683/500000]
+ train/ActionL1Loss=0.0393
+ throughput/total_tokens=1,283,136,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6684/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,283,328,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6685/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,283,520,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6686/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,283,712,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6687/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,283,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6688/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,284,096,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6689/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,284,288,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6690/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,284,480,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6691/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,284,672,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6692/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,284,864,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6693/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,285,056,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6694/500000]
+ train/ActionL1Loss=0.0435
+ throughput/total_tokens=1,285,248,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6695/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=1,285,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6696/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,285,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6697/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,285,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6698/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,286,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6699/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,286,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6700/500000]
+ optim/total_grad_norm=9.962
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,286,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6701/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=1,286,592,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6702/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,286,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6703/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,286,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6704/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=1,287,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6705/500000]
+ train/ActionL1Loss=0.0350
+ throughput/total_tokens=1,287,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6706/500000]
+ train/ActionL1Loss=0.0387
+ throughput/total_tokens=1,287,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6707/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,287,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6708/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,287,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6709/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,288,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6710/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,288,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=6711/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,288,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6712/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,288,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6713/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,288,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6714/500000]
+ train/ActionL1Loss=0.0361
+ throughput/total_tokens=1,289,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6715/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,289,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6716/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,289,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6717/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,289,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6718/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,289,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6719/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,290,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6720/500000]
+ optim/total_grad_norm=6.731
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,290,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6721/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,290,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6722/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,290,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6723/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,290,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6724/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,291,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6725/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,291,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6726/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,291,392,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6727/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,291,584,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6728/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,291,776,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6729/500000]
+ train/ActionL1Loss=0.0396
+ throughput/total_tokens=1,291,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6730/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,292,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6731/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,292,352,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6732/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,292,544,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6733/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,292,736,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6734/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,292,928,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6735/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,293,120,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6736/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,293,312,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6737/500000]
+ train/ActionL1Loss=0.0369
+ throughput/total_tokens=1,293,504,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6738/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,293,696,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6739/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,293,888,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6740/500000]
+ optim/total_grad_norm=9.080
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,294,080,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6741/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,294,272,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6742/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,294,464,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6743/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=1,294,656,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6744/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,294,848,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6745/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,295,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6746/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=1,295,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6747/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=1,295,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6748/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,295,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6749/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,295,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6750/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,296,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6751/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,296,192,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6752/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,296,384,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6753/500000]
+ train/ActionL1Loss=0.0392
+ throughput/total_tokens=1,296,576,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6754/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,296,768,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6755/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,296,960,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6756/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=1,297,152,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6757/500000]
+ train/ActionL1Loss=0.0411
+ throughput/total_tokens=1,297,344,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6758/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,297,536,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6759/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,297,728,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6760/500000]
+ optim/total_grad_norm=8.064
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,297,920,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6761/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,298,112,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6762/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,298,304,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6763/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,298,496,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6764/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,298,688,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6765/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,298,880,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6766/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,299,072,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6767/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,299,264,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6768/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=1,299,456,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6769/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,299,648,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6770/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,299,840,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6771/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,300,032,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6772/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,300,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6773/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,300,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6774/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,300,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6775/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,300,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6776/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,300,992,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6777/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,301,184,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6778/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,301,376,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6779/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,301,568,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6780/500000]
+ optim/total_grad_norm=8.023
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,301,760,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6781/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,301,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6782/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,302,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6783/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,302,336,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6784/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=1,302,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6785/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,302,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6786/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,302,912,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6787/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,303,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6788/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,303,296,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6789/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,303,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6790/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,303,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6791/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,303,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6792/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,304,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6793/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,304,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6794/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,304,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6795/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,304,640,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6796/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,304,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6797/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,305,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6798/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,305,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6799/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,305,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6800/500000]
+ optim/total_grad_norm=8.973
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,305,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6801/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,305,792,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6802/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,305,984,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6803/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,306,176,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6804/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,306,368,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6805/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,306,560,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6806/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,306,752,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6807/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,306,944,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6808/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,307,136,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6809/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,307,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6810/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,307,520,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6811/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,307,712,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6812/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,307,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6813/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,308,096,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6814/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,308,288,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6815/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,308,480,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6816/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,308,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6817/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,308,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6818/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,309,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6819/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,309,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6820/500000]
+ optim/total_grad_norm=8.389
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,309,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6821/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,309,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6822/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,309,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6823/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,310,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6824/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=1,310,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6825/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,310,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6826/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,310,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6827/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,310,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6828/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=1,310,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6829/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,311,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6830/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,311,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6831/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,311,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6832/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,311,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6833/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,311,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6834/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,312,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6835/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,312,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6836/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,312,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6837/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=1,312,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6838/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,312,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6839/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,313,088,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6840/500000]
+ optim/total_grad_norm=8.343
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,313,280,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6841/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,313,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6842/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,313,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6843/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,313,856,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6844/500000]
+ train/ActionL1Loss=0.0332
+ throughput/total_tokens=1,314,048,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6845/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,314,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6846/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,314,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6847/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,314,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6848/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,314,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6849/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,315,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6850/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,315,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6851/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,315,392,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6852/500000]
+ train/ActionL1Loss=0.0323
+ throughput/total_tokens=1,315,584,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6853/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,315,776,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6854/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,315,968,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6855/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,316,160,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6856/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,316,352,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6857/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,316,544,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6858/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,316,736,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6859/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,316,928,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6860/500000]
+ optim/total_grad_norm=7.229
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,317,120,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=6861/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,317,312,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6862/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,317,504,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6863/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=1,317,696,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6864/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,317,888,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6865/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,318,080,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=6866/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=1,318,272,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=6867/500000]
+ train/ActionL1Loss=0.0376
+ throughput/total_tokens=1,318,464,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6868/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=1,318,656,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6869/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,318,848,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=6870/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,319,040,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6871/500000]
+ train/ActionL1Loss=0.0388
+ throughput/total_tokens=1,319,232,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6872/500000]
+ train/ActionL1Loss=0.0364
+ throughput/total_tokens=1,319,424,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6873/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=1,319,616,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6874/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,319,808,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6875/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=1,320,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6876/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,320,192,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6877/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,320,384,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6878/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,320,576,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6879/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,320,768,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6880/500000]
+ optim/total_grad_norm=8.155
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,320,960,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6881/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,321,152,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6882/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,321,344,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6883/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,321,536,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6884/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,321,728,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6885/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,321,920,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6886/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,322,112,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6887/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,322,304,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6888/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,322,496,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6889/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,322,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6890/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,322,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6891/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,323,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6892/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,323,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6893/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,323,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6894/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,323,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6895/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,323,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6896/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,324,032,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6897/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,324,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6898/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,324,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6899/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,324,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6900/500000]
+ optim/total_grad_norm=8.206
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,324,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6901/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,324,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6902/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,325,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6903/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,325,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6904/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,325,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6905/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,325,760,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6906/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,325,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6907/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,326,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6908/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,326,336,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6909/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,326,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6910/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,326,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=6911/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,326,912,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6912/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,327,104,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6913/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,327,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6914/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,327,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6915/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,327,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=6916/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,327,872,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=6917/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,328,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6918/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=1,328,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6919/500000]
+ train/ActionL1Loss=0.0325
+ throughput/total_tokens=1,328,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6920/500000]
+ optim/total_grad_norm=8.938
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,328,640,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6921/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,328,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6922/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,329,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6923/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,329,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6924/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,329,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6925/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,329,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6926/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,329,792,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6927/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,329,984,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6928/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,330,176,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=6929/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,330,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6930/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=1,330,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=6931/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,330,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6932/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,330,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6933/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,331,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6934/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,331,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=6935/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,331,520,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=6936/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,331,712,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6937/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,331,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6938/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=1,332,096,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6939/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,332,288,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6940/500000]
+ optim/total_grad_norm=8.566
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,332,480,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6941/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,332,672,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6942/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,332,864,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6943/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,333,056,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6944/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,333,248,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6945/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,333,440,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6946/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,333,632,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6947/500000]
+ train/ActionL1Loss=0.0323
+ throughput/total_tokens=1,333,824,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6948/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,334,016,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6949/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,334,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6950/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,334,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6951/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,334,592,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6952/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,334,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6953/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,334,976,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6954/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=1,335,168,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6955/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,335,360,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6956/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,335,552,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6957/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,335,744,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6958/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,335,936,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6959/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,336,128,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6960/500000]
+ optim/total_grad_norm=8.644
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=1,336,320,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=6961/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,336,512,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6962/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,336,704,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6963/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,336,896,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6964/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,337,088,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6965/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,337,280,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6966/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,337,472,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6967/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,337,664,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6968/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,337,856,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6969/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,338,048,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=6970/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,338,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6971/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,338,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6972/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,338,624,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6973/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,338,816,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6974/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,339,008,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6975/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,339,200,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6976/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=1,339,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6977/500000]
+ train/ActionL1Loss=0.0392
+ throughput/total_tokens=1,339,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6978/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,339,776,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6979/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,339,968,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6980/500000]
+ optim/total_grad_norm=9.881
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=1,340,160,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6981/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,340,352,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6982/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,340,544,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6983/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,340,736,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6984/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,340,928,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6985/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,341,120,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6986/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,341,312,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6987/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,341,504,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6988/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,341,696,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6989/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,341,888,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6990/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,342,080,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=6991/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,342,272,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=6992/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,342,464,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6993/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,342,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6994/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,342,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6995/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,343,040,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6996/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,343,232,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6997/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,343,424,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6998/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,343,616,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=6999/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,343,808,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7000/500000]
+ optim/total_grad_norm=9.226
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,344,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+10/04 [09:05:46] INFO | >> Saving config... checkpoint.py:608
+10/04 [09:06:22] INFO | >> Saving model state... checkpoint.py:796
+10/04 [09:07:31] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [09:09:00] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=7001/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,344,192,000
+ throughput/device/tokens_per_second=1,221
+ throughput/device/batches_per_second=0.0509
+[step=7002/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,344,384,000
+ throughput/device/tokens_per_second=1,203
+ throughput/device/batches_per_second=0.0501
+[step=7003/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=1,344,576,000
+ throughput/device/tokens_per_second=1,197
+ throughput/device/batches_per_second=0.0499
+[step=7004/500000]
+ train/ActionL1Loss=0.0358
+ throughput/total_tokens=1,344,768,000
+ throughput/device/tokens_per_second=1,193
+ throughput/device/batches_per_second=0.0497
+[step=7005/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,344,960,000
+ throughput/device/tokens_per_second=1,190
+ throughput/device/batches_per_second=0.0496
+[step=7006/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,345,152,000
+ throughput/device/tokens_per_second=1,190
+ throughput/device/batches_per_second=0.0496
+[step=7007/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,345,344,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=7008/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,345,536,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=7009/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,345,728,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=7010/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,345,920,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=7011/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,346,112,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=7012/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,346,304,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=7013/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,346,496,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=7014/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,346,688,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7015/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,346,880,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7016/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,347,072,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7017/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,347,264,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7018/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,347,456,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7019/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,347,648,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7020/500000]
+ optim/total_grad_norm=6.616
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,347,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7021/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=1,348,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7022/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,348,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7023/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,348,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7024/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,348,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7025/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,348,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7026/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,348,992,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7027/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,349,184,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7028/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,349,376,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7029/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,349,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7030/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,349,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7031/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,349,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7032/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,350,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7033/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,350,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7034/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,350,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7035/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,350,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7036/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,350,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7037/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=1,351,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7038/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,351,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7039/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,351,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7040/500000]
+ optim/total_grad_norm=9.150
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,351,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7041/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,351,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7042/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,352,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7043/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,352,256,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7044/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,352,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7045/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,352,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7046/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,352,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7047/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,353,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7048/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,353,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7049/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,353,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7050/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,353,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7051/500000]
+ train/ActionL1Loss=0.0383
+ throughput/total_tokens=1,353,792,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7052/500000]
+ train/ActionL1Loss=0.0325
+ throughput/total_tokens=1,353,984,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7053/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,354,176,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7054/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,354,368,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7055/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,354,560,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7056/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,354,752,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7057/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,354,944,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7058/500000]
+ train/ActionL1Loss=0.0323
+ throughput/total_tokens=1,355,136,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7059/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,355,328,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7060/500000]
+ optim/total_grad_norm=7.061
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=1,355,520,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7061/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,355,712,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7062/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,355,904,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7063/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,356,096,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7064/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,356,288,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7065/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,356,480,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7066/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,356,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7067/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=1,356,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7068/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,357,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7069/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,357,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7070/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,357,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7071/500000]
+ train/ActionL1Loss=0.0360
+ throughput/total_tokens=1,357,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7072/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,357,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7073/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,358,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=7074/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,358,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=7075/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,358,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7076/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,358,592,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7077/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,358,784,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7078/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,358,976,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7079/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,359,168,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7080/500000]
+ optim/total_grad_norm=8.328
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,359,360,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7081/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,359,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7082/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,359,744,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7083/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,359,936,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7084/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,360,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7085/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,360,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7086/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,360,512,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7087/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,360,704,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7088/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,360,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7089/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,361,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7090/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,361,280,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7091/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,361,472,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7092/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,361,664,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7093/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,361,856,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7094/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,362,048,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7095/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,362,240,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7096/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,362,432,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7097/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,362,624,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7098/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,362,816,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7099/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,363,008,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7100/500000]
+ optim/total_grad_norm=9.195
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,363,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7101/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,363,392,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7102/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,363,584,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7103/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,363,776,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7104/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,363,968,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7105/500000]
+ train/ActionL1Loss=0.0323
+ throughput/total_tokens=1,364,160,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7106/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,364,352,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7107/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,364,544,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7108/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,364,736,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7109/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,364,928,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7110/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=1,365,120,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7111/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,365,312,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7112/500000]
+ train/ActionL1Loss=0.0393
+ throughput/total_tokens=1,365,504,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7113/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,365,696,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7114/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,365,888,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7115/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,366,080,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7116/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,366,272,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7117/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,366,464,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7118/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,366,656,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7119/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,366,848,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7120/500000]
+ optim/total_grad_norm=7.966
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,367,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7121/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,367,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7122/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,367,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7123/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,367,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7124/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,367,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7125/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,368,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7126/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,368,192,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=7127/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,368,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7128/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,368,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7129/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,368,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7130/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,368,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7131/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,369,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7132/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,369,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7133/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,369,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7134/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,369,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7135/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,369,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7136/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,370,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7137/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,370,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7138/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,370,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7139/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,370,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7140/500000]
+ optim/total_grad_norm=9.462
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,370,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7141/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,371,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7142/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,371,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7143/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,371,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7144/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,371,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7145/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,371,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7146/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,372,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7147/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,372,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7148/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,372,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7149/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,372,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7150/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,372,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7151/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,372,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7152/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,373,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7153/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,373,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7154/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,373,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7155/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,373,760,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7156/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,373,952,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7157/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,374,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7158/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,374,336,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7159/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,374,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7160/500000]
+ optim/total_grad_norm=6.522
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,374,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7161/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,374,912,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7162/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,375,104,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7163/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,375,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7164/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,375,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7165/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,375,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7166/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,375,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7167/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,376,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7168/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,376,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7169/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,376,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7170/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=1,376,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7171/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,376,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7172/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,377,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7173/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,377,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7174/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,377,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7175/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,377,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7176/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,377,792,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7177/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,377,984,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7178/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,378,176,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7179/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,378,368,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7180/500000]
+ optim/total_grad_norm=7.679
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=1,378,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7181/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,378,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7182/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,378,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7183/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,379,136,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7184/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,379,328,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7185/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,379,520,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7186/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,379,712,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7187/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,379,904,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7188/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,380,096,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7189/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,380,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7190/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,380,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7191/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,380,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7192/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,380,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7193/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,381,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7194/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,381,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7195/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,381,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7196/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,381,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7197/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,381,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7198/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,382,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7199/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,382,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7200/500000]
+ optim/total_grad_norm=7.251
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,382,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7201/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,382,592,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7202/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,382,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7203/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,382,976,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7204/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=1,383,168,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7205/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,383,360,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=7206/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,383,552,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=7207/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,383,744,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=7208/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,383,936,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=7209/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,384,128,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=7210/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,384,320,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+ System/Peak GPU Memory (MB)=46,917
+[step=7211/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,384,512,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7212/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,384,704,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7213/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,384,896,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7214/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=1,385,088,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7215/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,385,280,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7216/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,385,472,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7217/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,385,664,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7218/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,385,856,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7219/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,386,048,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7220/500000]
+ optim/total_grad_norm=8.537
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,386,240,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7221/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,386,432,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7222/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,386,624,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7223/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,386,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7224/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,387,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7225/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,387,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7226/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,387,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7227/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,387,584,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=7228/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,387,776,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=7229/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,387,968,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7230/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,388,160,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7231/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,388,352,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7232/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,388,544,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7233/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,388,736,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7234/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,388,928,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7235/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,389,120,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7236/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,389,312,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7237/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,389,504,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7238/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,389,696,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7239/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,389,888,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7240/500000]
+ optim/total_grad_norm=7.709
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,390,080,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7241/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,390,272,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7242/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,390,464,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7243/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,390,656,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7244/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,390,848,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7245/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,391,040,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7246/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,391,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7247/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,391,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7248/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,391,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7249/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,391,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7250/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,392,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7251/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,392,192,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=7252/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,392,384,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=7253/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,392,576,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=7254/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,392,768,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=7255/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,392,960,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=7256/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,393,152,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=7257/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,393,344,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=7258/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,393,536,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=7259/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,393,728,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7260/500000]
+ optim/total_grad_norm=9.448
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,393,920,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=7261/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,394,112,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7262/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,394,304,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7263/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,394,496,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7264/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,394,688,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7265/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=1,394,880,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7266/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,395,072,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7267/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,395,264,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7268/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,395,456,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7269/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,395,648,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7270/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,395,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7271/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,396,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7272/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,396,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7273/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,396,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7274/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,396,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7275/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,396,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7276/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,396,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7277/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,397,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7278/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,397,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7279/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,397,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7280/500000]
+ optim/total_grad_norm=9.096
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,397,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7281/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,397,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7282/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,398,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7283/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,398,336,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7284/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,398,528,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7285/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,398,720,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7286/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,398,912,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7287/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,399,104,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7288/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,399,296,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7289/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,399,488,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7290/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=1,399,680,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7291/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,399,872,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7292/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,400,064,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7293/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,400,256,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7294/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,400,448,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7295/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,400,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7296/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,400,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7297/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,401,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7298/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,401,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7299/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=1,401,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7300/500000]
+ optim/total_grad_norm=7.868
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,401,600,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7301/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,401,792,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7302/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,401,984,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7303/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,402,176,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7304/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,402,368,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7305/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=1,402,560,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7306/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,402,752,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7307/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,402,944,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7308/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,403,136,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7309/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,403,328,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7310/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,403,520,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7311/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,403,712,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7312/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,403,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7313/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,404,096,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7314/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,404,288,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7315/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,404,480,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7316/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,404,672,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7317/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,404,864,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7318/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,405,056,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7319/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,405,248,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7320/500000]
+ optim/total_grad_norm=7.367
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,405,440,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7321/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,405,632,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7322/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,405,824,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7323/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,406,016,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7324/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,406,208,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7325/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=1,406,400,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7326/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,406,592,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7327/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,406,784,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7328/500000]
+ train/ActionL1Loss=0.0363
+ throughput/total_tokens=1,406,976,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7329/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,407,168,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7330/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,407,360,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7331/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,407,552,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7332/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,407,744,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7333/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,407,936,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7334/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,408,128,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7335/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,408,320,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7336/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,408,512,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7337/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,408,704,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7338/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,408,896,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7339/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,409,088,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7340/500000]
+ optim/total_grad_norm=7.109
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,409,280,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7341/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,409,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7342/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,409,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7343/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,409,856,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7344/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,410,048,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7345/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,410,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7346/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,410,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7347/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,410,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7348/500000]
+ train/ActionL1Loss=0.0347
+ throughput/total_tokens=1,410,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7349/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,411,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7350/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,411,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7351/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,411,392,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7352/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,411,584,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7353/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,411,776,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7354/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,411,968,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7355/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,412,160,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7356/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,412,352,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7357/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,412,544,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7358/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,412,736,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7359/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,412,928,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7360/500000]
+ optim/total_grad_norm=8.932
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,413,120,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=7361/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,413,312,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7362/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,413,504,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7363/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,413,696,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7364/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,413,888,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7365/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,414,080,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7366/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,414,272,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7367/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,414,464,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7368/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,414,656,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7369/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,414,848,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7370/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,415,040,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7371/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,415,232,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7372/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,415,424,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7373/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,415,616,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7374/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,415,808,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7375/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,416,000,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7376/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,416,192,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7377/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,416,384,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7378/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,416,576,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7379/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,416,768,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7380/500000]
+ optim/total_grad_norm=7.050
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,416,960,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7381/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,417,152,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7382/500000]
+ train/ActionL1Loss=0.0359
+ throughput/total_tokens=1,417,344,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7383/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,417,536,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7384/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,417,728,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7385/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,417,920,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7386/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,418,112,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7387/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,418,304,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7388/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,418,496,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7389/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,418,688,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7390/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,418,880,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7391/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,419,072,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7392/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,419,264,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7393/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,419,456,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7394/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,419,648,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7395/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,419,840,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7396/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,420,032,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7397/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,420,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7398/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,420,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7399/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,420,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7400/500000]
+ optim/total_grad_norm=6.861
+ train/ActionL1Loss=0.0399
+ throughput/total_tokens=1,420,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7401/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,420,992,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7402/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,421,184,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7403/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,421,376,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7404/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,421,568,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7405/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,421,760,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7406/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,421,952,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7407/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,422,144,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7408/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,422,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7409/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,422,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7410/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,422,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=7411/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,422,912,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7412/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,423,104,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7413/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,423,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7414/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,423,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7415/500000]
+ train/ActionL1Loss=0.0337
+ throughput/total_tokens=1,423,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7416/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=1,423,872,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7417/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,424,064,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7418/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=1,424,256,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7419/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,424,448,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7420/500000]
+ optim/total_grad_norm=8.771
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,424,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7421/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,424,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7422/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=1,425,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7423/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,425,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7424/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,425,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7425/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,425,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7426/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,425,792,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7427/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,425,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7428/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,426,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7429/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,426,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7430/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,426,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7431/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,426,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7432/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,426,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7433/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,427,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7434/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,427,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7435/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,427,520,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7436/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,427,712,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7437/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,427,904,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7438/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,428,096,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7439/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,428,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7440/500000]
+ optim/total_grad_norm=7.547
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,428,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7441/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,428,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7442/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,428,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7443/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,429,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7444/500000]
+ train/ActionL1Loss=0.0426
+ throughput/total_tokens=1,429,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7445/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=1,429,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7446/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,429,632,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7447/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,429,824,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7448/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,430,016,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7449/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,430,208,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7450/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,430,400,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7451/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,430,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7452/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,430,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7453/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,430,976,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7454/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,431,168,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7455/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,431,360,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=7456/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,431,552,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7457/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,431,744,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7458/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,431,936,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7459/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,432,128,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7460/500000]
+ optim/total_grad_norm=7.161
+ train/ActionL1Loss=0.0323
+ throughput/total_tokens=1,432,320,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=7461/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,432,512,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7462/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,432,704,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7463/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,432,896,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7464/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,433,088,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7465/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,433,280,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7466/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,433,472,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7467/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,433,664,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7468/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,433,856,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7469/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,434,048,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7470/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,434,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7471/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,434,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7472/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,434,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7473/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,434,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7474/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,435,008,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=7475/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,435,200,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=7476/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,435,392,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=7477/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,435,584,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=7478/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,435,776,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7479/500000]
+ train/ActionL1Loss=0.0385
+ throughput/total_tokens=1,435,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7480/500000]
+ optim/total_grad_norm=9.790
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,436,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7481/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,436,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7482/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,436,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7483/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,436,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7484/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,436,928,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7485/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,437,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7486/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,437,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7487/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,437,504,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7488/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,437,696,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7489/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,437,888,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7490/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,438,080,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7491/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,438,272,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7492/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,438,464,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7493/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,438,656,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=7494/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,438,848,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=7495/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,439,040,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=7496/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,439,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=7497/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,439,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7498/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,439,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7499/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,439,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7500/500000]
+ optim/total_grad_norm=8.847
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,440,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+10/04 [11:59:08] INFO | >> Saving config... checkpoint.py:608
+10/04 [11:59:52] INFO | >> Saving model state... checkpoint.py:796
+10/04 [12:01:03] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [12:02:34] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=7501/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,440,192,000
+ throughput/device/tokens_per_second=1,219
+ throughput/device/batches_per_second=0.0508
+[step=7502/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,440,384,000
+ throughput/device/tokens_per_second=1,195
+ throughput/device/batches_per_second=0.0498
+[step=7503/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,440,576,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7504/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,440,768,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=7505/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,440,960,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=7506/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,441,152,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=7507/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,441,344,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7508/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,441,536,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7509/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,441,728,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7510/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=1,441,920,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=7511/500000]
+ train/ActionL1Loss=0.0325
+ throughput/total_tokens=1,442,112,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7512/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,442,304,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7513/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,442,496,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7514/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,442,688,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7515/500000]
+ train/ActionL1Loss=0.0413
+ throughput/total_tokens=1,442,880,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7516/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,443,072,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7517/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,443,264,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7518/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,443,456,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7519/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,443,648,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7520/500000]
+ optim/total_grad_norm=7.908
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,443,840,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=7521/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,444,032,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=7522/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,444,224,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7523/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,444,416,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7524/500000]
+ train/ActionL1Loss=0.0766
+ throughput/total_tokens=1,444,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=7525/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,444,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7526/500000]
+ train/ActionL1Loss=0.0809
+ throughput/total_tokens=1,444,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7527/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,445,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7528/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,445,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7529/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,445,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7530/500000]
+ train/ActionL1Loss=0.0759
+ throughput/total_tokens=1,445,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7531/500000]
+ train/ActionL1Loss=0.0823
+ throughput/total_tokens=1,445,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7532/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,446,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7533/500000]
+ train/ActionL1Loss=0.0794
+ throughput/total_tokens=1,446,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7534/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,446,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7535/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,446,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7536/500000]
+ train/ActionL1Loss=0.1340
+ throughput/total_tokens=1,446,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7537/500000]
+ train/ActionL1Loss=0.0855
+ throughput/total_tokens=1,447,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7538/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,447,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7539/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,447,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7540/500000]
+ optim/total_grad_norm=8.682
+ train/ActionL1Loss=0.0398
+ throughput/total_tokens=1,447,680,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7541/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,447,872,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7542/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=1,448,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7543/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,448,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7544/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=1,448,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7545/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,448,640,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7546/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,448,832,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7547/500000]
+ train/ActionL1Loss=0.0560
+ throughput/total_tokens=1,449,024,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7548/500000]
+ train/ActionL1Loss=0.0524
+ throughput/total_tokens=1,449,216,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7549/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,449,408,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7550/500000]
+ train/ActionL1Loss=0.0542
+ throughput/total_tokens=1,449,600,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7551/500000]
+ train/ActionL1Loss=0.0453
+ throughput/total_tokens=1,449,792,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7552/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,449,984,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7553/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,450,176,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7554/500000]
+ train/ActionL1Loss=0.0356
+ throughput/total_tokens=1,450,368,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7555/500000]
+ train/ActionL1Loss=0.0366
+ throughput/total_tokens=1,450,560,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7556/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,450,752,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7557/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,450,944,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7558/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=1,451,136,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7559/500000]
+ train/ActionL1Loss=0.0370
+ throughput/total_tokens=1,451,328,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=7560/500000]
+ optim/total_grad_norm=7.789
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=1,451,520,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=7561/500000]
+ train/ActionL1Loss=0.0339
+ throughput/total_tokens=1,451,712,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7562/500000]
+ train/ActionL1Loss=0.0340
+ throughput/total_tokens=1,451,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7563/500000]
+ train/ActionL1Loss=0.0379
+ throughput/total_tokens=1,452,096,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7564/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,452,288,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7565/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,452,480,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7566/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,452,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7567/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,452,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7568/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,453,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7569/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,453,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7570/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,453,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7571/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,453,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7572/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,453,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7573/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,454,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7574/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,454,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7575/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,454,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7576/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,454,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7577/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,454,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7578/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,454,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7579/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,455,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7580/500000]
+ optim/total_grad_norm=6.858
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,455,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7581/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,455,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7582/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,455,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7583/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,455,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7584/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=1,456,128,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7585/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,456,320,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7586/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,456,512,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7587/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,456,704,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7588/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,456,896,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7589/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,457,088,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7590/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,457,280,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7591/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,457,472,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7592/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,457,664,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7593/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=1,457,856,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7594/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,458,048,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7595/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,458,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7596/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,458,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7597/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=1,458,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7598/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,458,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7599/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,459,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7600/500000]
+ optim/total_grad_norm=9.640
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=1,459,200,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7601/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,459,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7602/500000]
+ train/ActionL1Loss=0.0373
+ throughput/total_tokens=1,459,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7603/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,459,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7604/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=1,459,968,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7605/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,460,160,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7606/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,460,352,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7607/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,460,544,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7608/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,460,736,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7609/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,460,928,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7610/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,461,120,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7611/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,461,312,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7612/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,461,504,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7613/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,461,696,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7614/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=1,461,888,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7615/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,462,080,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7616/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,462,272,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7617/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,462,464,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7618/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=1,462,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7619/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,462,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7620/500000]
+ optim/total_grad_norm=6.785
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,463,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7621/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,463,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7622/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,463,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7623/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,463,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7624/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=1,463,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7625/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,464,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7626/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=1,464,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7627/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,464,384,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7628/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,464,576,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7629/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,464,768,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7630/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=1,464,960,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7631/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,465,152,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7632/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,465,344,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7633/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,465,536,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7634/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,465,728,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7635/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,465,920,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7636/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,466,112,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7637/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,466,304,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7638/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,466,496,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7639/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,466,688,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7640/500000]
+ optim/total_grad_norm=9.000
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,466,880,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7641/500000]
+ train/ActionL1Loss=0.0381
+ throughput/total_tokens=1,467,072,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7642/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=1,467,264,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7643/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,467,456,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7644/500000]
+ train/ActionL1Loss=0.0376
+ throughput/total_tokens=1,467,648,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7645/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,467,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7646/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,468,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7647/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,468,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7648/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,468,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7649/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=1,468,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7650/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,468,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7651/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,468,992,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7652/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,469,184,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7653/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,469,376,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7654/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,469,568,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7655/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,469,760,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7656/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,469,952,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7657/500000]
+ train/ActionL1Loss=0.0387
+ throughput/total_tokens=1,470,144,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7658/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,470,336,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7659/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,470,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7660/500000]
+ optim/total_grad_norm=7.288
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,470,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7661/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,470,912,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7662/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,471,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7663/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,471,296,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7664/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,471,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7665/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,471,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7666/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,471,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7667/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,472,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7668/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,472,256,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7669/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,472,448,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7670/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,472,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7671/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,472,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7672/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,473,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7673/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,473,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7674/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,473,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7675/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,473,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7676/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=1,473,792,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7677/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,473,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7678/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,474,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7679/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,474,368,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7680/500000]
+ optim/total_grad_norm=7.442
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=1,474,560,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7681/500000]
+ train/ActionL1Loss=0.0341
+ throughput/total_tokens=1,474,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7682/500000]
+ train/ActionL1Loss=0.0379
+ throughput/total_tokens=1,474,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7683/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,475,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7684/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=1,475,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7685/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,475,520,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7686/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=1,475,712,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7687/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,475,904,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7688/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,476,096,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7689/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,476,288,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7690/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,476,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7691/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=1,476,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7692/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,476,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7693/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,477,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7694/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=1,477,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7695/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=1,477,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7696/500000]
+ train/ActionL1Loss=0.0357
+ throughput/total_tokens=1,477,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7697/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,477,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7698/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,478,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7699/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,478,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7700/500000]
+ optim/total_grad_norm=8.015
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,478,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7701/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,478,592,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7702/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,478,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7703/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=1,478,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7704/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,479,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7705/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,479,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7706/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,479,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7707/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,479,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7708/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,479,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7709/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,480,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7710/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,480,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7711/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,480,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7712/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,480,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7713/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,480,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7714/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,481,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7715/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,481,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7716/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,481,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7717/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,481,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7718/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,481,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7719/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,482,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7720/500000]
+ optim/total_grad_norm=7.474
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,482,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7721/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,482,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7722/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,482,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7723/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,482,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7724/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,483,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7725/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,483,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7726/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,483,392,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7727/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,483,584,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7728/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,483,776,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7729/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,483,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7730/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,484,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7731/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,484,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7732/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,484,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7733/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,484,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7734/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,484,928,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7735/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,485,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7736/500000]
+ train/ActionL1Loss=0.0387
+ throughput/total_tokens=1,485,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7737/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,485,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7738/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,485,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7739/500000]
+ train/ActionL1Loss=0.0339
+ throughput/total_tokens=1,485,888,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7740/500000]
+ optim/total_grad_norm=7.876
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,486,080,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7741/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,486,272,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7742/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,486,464,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7743/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,486,656,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7744/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,486,848,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7745/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,487,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7746/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,487,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7747/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,487,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7748/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,487,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7749/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,487,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7750/500000]
+ train/ActionL1Loss=0.0336
+ throughput/total_tokens=1,488,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7751/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,488,192,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7752/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,488,384,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7753/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,488,576,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7754/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,488,768,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7755/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,488,960,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7756/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,489,152,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7757/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,489,344,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7758/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,489,536,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7759/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,489,728,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7760/500000]
+ optim/total_grad_norm=7.003
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,489,920,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7761/500000]
+ train/ActionL1Loss=0.0322
+ throughput/total_tokens=1,490,112,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7762/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,490,304,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7763/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,490,496,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7764/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,490,688,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7765/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,490,880,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7766/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,491,072,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7767/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,491,264,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7768/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,491,456,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7769/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,491,648,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7770/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,491,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7771/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,492,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7772/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,492,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7773/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,492,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7774/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,492,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7775/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,492,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7776/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,492,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7777/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,493,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7778/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,493,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7779/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=1,493,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7780/500000]
+ optim/total_grad_norm=8.539
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,493,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7781/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,493,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7782/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,494,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7783/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,494,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7784/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,494,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7785/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,494,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7786/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=1,494,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7787/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,495,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7788/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,495,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7789/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,495,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7790/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,495,680,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7791/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,495,872,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7792/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,496,064,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7793/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,496,256,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7794/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,496,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7795/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,496,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7796/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,496,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7797/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,497,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7798/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,497,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7799/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,497,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7800/500000]
+ optim/total_grad_norm=8.735
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,497,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7801/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,497,792,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7802/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,497,984,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7803/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,498,176,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7804/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,498,368,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7805/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,498,560,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7806/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,498,752,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7807/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,498,944,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7808/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,499,136,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7809/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,499,328,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7810/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=1,499,520,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7811/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,499,712,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7812/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,499,904,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7813/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,500,096,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7814/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,500,288,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7815/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,500,480,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7816/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,500,672,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7817/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,500,864,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7818/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,501,056,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7819/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,501,248,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7820/500000]
+ optim/total_grad_norm=7.529
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,501,440,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=7821/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,501,632,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=7822/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,501,824,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=7823/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,502,016,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=7824/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,502,208,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=7825/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,502,400,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=7826/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,502,592,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=7827/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,502,784,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7828/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=1,502,976,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7829/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,503,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7830/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,503,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7831/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,503,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7832/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,503,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7833/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,503,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7834/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,504,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7835/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,504,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7836/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,504,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7837/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,504,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7838/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,504,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7839/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,505,088,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7840/500000]
+ optim/total_grad_norm=6.562
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,505,280,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7841/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,505,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7842/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,505,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7843/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=1,505,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=7844/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=1,506,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7845/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,506,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7846/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=1,506,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=7847/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,506,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7848/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,506,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7849/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,507,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7850/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,507,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7851/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,507,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7852/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,507,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7853/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,507,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7854/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,507,968,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7855/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,508,160,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7856/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,508,352,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7857/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=1,508,544,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7858/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,508,736,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7859/500000]
+ train/ActionL1Loss=0.0358
+ throughput/total_tokens=1,508,928,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7860/500000]
+ optim/total_grad_norm=6.935
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,509,120,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7861/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,509,312,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7862/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,509,504,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7863/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,509,696,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7864/500000]
+ train/ActionL1Loss=0.0325
+ throughput/total_tokens=1,509,888,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7865/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,510,080,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7866/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,510,272,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7867/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,510,464,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7868/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,510,656,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7869/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,510,848,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7870/500000]
+ train/ActionL1Loss=0.0319
+ throughput/total_tokens=1,511,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7871/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,511,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7872/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,511,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7873/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,511,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7874/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,511,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7875/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,512,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7876/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,512,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7877/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,512,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7878/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,512,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7879/500000]
+ train/ActionL1Loss=0.0471
+ throughput/total_tokens=1,512,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7880/500000]
+ optim/total_grad_norm=8.009
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,512,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7881/500000]
+ train/ActionL1Loss=0.0385
+ throughput/total_tokens=1,513,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7882/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,513,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7883/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,513,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7884/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=1,513,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7885/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=1,513,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7886/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=1,514,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7887/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,514,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7888/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,514,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7889/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,514,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7890/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,514,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7891/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,515,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7892/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=1,515,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7893/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,515,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7894/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,515,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7895/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,515,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7896/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=1,516,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7897/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,516,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7898/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,516,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7899/500000]
+ train/ActionL1Loss=0.0369
+ throughput/total_tokens=1,516,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7900/500000]
+ optim/total_grad_norm=9.447
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,516,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7901/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,516,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7902/500000]
+ train/ActionL1Loss=0.0332
+ throughput/total_tokens=1,517,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7903/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,517,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7904/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,517,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=7905/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,517,760,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7906/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,517,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7907/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,518,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7908/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,518,336,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7909/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,518,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7910/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,518,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7911/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,518,912,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7912/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,519,104,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7913/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,519,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7914/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,519,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7915/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,519,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7916/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,519,872,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7917/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,520,064,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7918/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,520,256,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=7919/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,520,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7920/500000]
+ optim/total_grad_norm=7.656
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,520,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7921/500000]
+ train/ActionL1Loss=0.0331
+ throughput/total_tokens=1,520,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7922/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,521,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7923/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,521,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7924/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,521,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7925/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,521,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7926/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,521,792,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7927/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,521,984,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7928/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,522,176,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7929/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,522,368,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7930/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,522,560,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7931/500000]
+ train/ActionL1Loss=0.0397
+ throughput/total_tokens=1,522,752,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7932/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,522,944,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7933/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,523,136,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7934/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,523,328,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7935/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,523,520,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7936/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,523,712,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7937/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,523,904,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7938/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,524,096,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7939/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,524,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7940/500000]
+ optim/total_grad_norm=7.896
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,524,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7941/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,524,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7942/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,524,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7943/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,525,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7944/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,525,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7945/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,525,440,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7946/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,525,632,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7947/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,525,824,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7948/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,526,016,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7949/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,526,208,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7950/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,526,400,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7951/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,526,592,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7952/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,526,784,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7953/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,526,976,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7954/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,527,168,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7955/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,527,360,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7956/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=1,527,552,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7957/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,527,744,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7958/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,527,936,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7959/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,528,128,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7960/500000]
+ optim/total_grad_norm=6.945
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=1,528,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=7961/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,528,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=7962/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,528,704,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7963/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,528,896,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7964/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,529,088,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7965/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,529,280,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7966/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,529,472,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7967/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,529,664,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7968/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,529,856,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7969/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,530,048,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=7970/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,530,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7971/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,530,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7972/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,530,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7973/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,530,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7974/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,531,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7975/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,531,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7976/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,531,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7977/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,531,584,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7978/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,531,776,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7979/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,531,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7980/500000]
+ optim/total_grad_norm=7.773
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,532,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7981/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,532,352,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7982/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,532,544,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7983/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,532,736,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7984/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,532,928,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7985/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,533,120,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7986/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,533,312,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7987/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,533,504,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7988/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,533,696,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7989/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,533,888,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7990/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,534,080,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=7991/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,534,272,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=7992/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,534,464,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7993/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,534,656,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7994/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=1,534,848,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7995/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,535,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7996/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,535,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7997/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,535,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7998/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=1,535,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=7999/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,535,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8000/500000]
+ optim/total_grad_norm=8.047
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,536,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+10/04 [14:52:39] INFO | >> Saving config... checkpoint.py:608
+10/04 [14:53:27] INFO | >> Saving model state... checkpoint.py:796
+10/04 [14:54:37] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [14:56:09] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=8001/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,536,192,000
+ throughput/device/tokens_per_second=1,221
+ throughput/device/batches_per_second=0.0509
+[step=8002/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,536,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8003/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,536,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8004/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,536,768,000
+ throughput/device/tokens_per_second=1,157
+ throughput/device/batches_per_second=0.0482
+[step=8005/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,536,960,000
+ throughput/device/tokens_per_second=1,163
+ throughput/device/batches_per_second=0.0485
+[step=8006/500000]
+ train/ActionL1Loss=0.0340
+ throughput/total_tokens=1,537,152,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=8007/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,537,344,000
+ throughput/device/tokens_per_second=1,171
+ throughput/device/batches_per_second=0.0488
+[step=8008/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,537,536,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=8009/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,537,728,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+[step=8010/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,537,920,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+ System/Peak GPU Memory (MB)=46,917
+[step=8011/500000]
+ train/ActionL1Loss=0.0376
+ throughput/total_tokens=1,538,112,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=8012/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,538,304,000
+ throughput/device/tokens_per_second=1,174
+ throughput/device/batches_per_second=0.0489
+[step=8013/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,538,496,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=8014/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,538,688,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=8015/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,538,880,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0491
+[step=8016/500000]
+ train/ActionL1Loss=0.0389
+ throughput/total_tokens=1,539,072,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=8017/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,539,264,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=8018/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,539,456,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=8019/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,539,648,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=8020/500000]
+ optim/total_grad_norm=7.135
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,539,840,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+ System/Peak GPU Memory (MB)=46,917
+[step=8021/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=1,540,032,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=8022/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,540,224,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=8023/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,540,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8024/500000]
+ train/ActionL1Loss=0.0396
+ throughput/total_tokens=1,540,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8025/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,540,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8026/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,540,992,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8027/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=1,541,184,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8028/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=1,541,376,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8029/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,541,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8030/500000]
+ train/ActionL1Loss=0.0448
+ throughput/total_tokens=1,541,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8031/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,541,952,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8032/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,542,144,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8033/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,542,336,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8034/500000]
+ train/ActionL1Loss=0.0347
+ throughput/total_tokens=1,542,528,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8035/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,542,720,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8036/500000]
+ train/ActionL1Loss=0.0382
+ throughput/total_tokens=1,542,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8037/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,543,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8038/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,543,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8039/500000]
+ train/ActionL1Loss=0.0336
+ throughput/total_tokens=1,543,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8040/500000]
+ optim/total_grad_norm=9.519
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,543,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8041/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,543,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8042/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,544,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8043/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,544,256,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8044/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,544,448,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8045/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,544,640,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8046/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=1,544,832,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8047/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,545,024,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8048/500000]
+ train/ActionL1Loss=0.0354
+ throughput/total_tokens=1,545,216,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8049/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,545,408,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8050/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,545,600,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8051/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,545,792,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8052/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,545,984,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8053/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,546,176,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8054/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,546,368,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8055/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=1,546,560,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8056/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,546,752,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8057/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,546,944,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8058/500000]
+ train/ActionL1Loss=0.0390
+ throughput/total_tokens=1,547,136,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8059/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,547,328,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8060/500000]
+ optim/total_grad_norm=9.272
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,547,520,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=8061/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,547,712,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8062/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,547,904,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8063/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,548,096,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8064/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,548,288,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8065/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,548,480,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8066/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,548,672,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8067/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,548,864,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8068/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,549,056,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8069/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,549,248,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8070/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,549,440,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8071/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,549,632,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8072/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,549,824,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8073/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,550,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8074/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,550,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8075/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,550,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8076/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,550,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8077/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,550,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8078/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=1,550,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8079/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,551,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8080/500000]
+ optim/total_grad_norm=7.922
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=1,551,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8081/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,551,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8082/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,551,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8083/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,551,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8084/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,552,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8085/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=1,552,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8086/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,552,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8087/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,552,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8088/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,552,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8089/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,553,088,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8090/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,553,280,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8091/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,553,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8092/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,553,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8093/500000]
+ train/ActionL1Loss=0.0305
+ throughput/total_tokens=1,553,856,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8094/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,554,048,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8095/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,554,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8096/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,554,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8097/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,554,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8098/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,554,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8099/500000]
+ train/ActionL1Loss=0.0388
+ throughput/total_tokens=1,555,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8100/500000]
+ optim/total_grad_norm=8.736
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,555,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8101/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,555,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8102/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,555,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8103/500000]
+ train/ActionL1Loss=0.0316
+ throughput/total_tokens=1,555,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8104/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,555,968,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8105/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,556,160,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8106/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,556,352,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8107/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,556,544,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8108/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,556,736,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8109/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,556,928,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8110/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,557,120,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8111/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,557,312,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8112/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,557,504,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8113/500000]
+ train/ActionL1Loss=0.0355
+ throughput/total_tokens=1,557,696,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8114/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,557,888,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8115/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,558,080,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8116/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,558,272,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8117/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,558,464,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8118/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,558,656,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8119/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,558,848,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8120/500000]
+ optim/total_grad_norm=8.172
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,559,040,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8121/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,559,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8122/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,559,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8123/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,559,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8124/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,559,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8125/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,560,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8126/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,560,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8127/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,560,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8128/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,560,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8129/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,560,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8130/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,560,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8131/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,561,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8132/500000]
+ train/ActionL1Loss=0.0381
+ throughput/total_tokens=1,561,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8133/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,561,536,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8134/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,561,728,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8135/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,561,920,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8136/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,562,112,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8137/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,562,304,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8138/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,562,496,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8139/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,562,688,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8140/500000]
+ optim/total_grad_norm=5.859
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,562,880,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8141/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,563,072,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8142/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,563,264,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8143/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,563,456,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8144/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,563,648,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8145/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,563,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8146/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,564,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8147/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=1,564,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8148/500000]
+ train/ActionL1Loss=0.0375
+ throughput/total_tokens=1,564,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8149/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,564,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8150/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=1,564,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8151/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=1,564,992,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8152/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,565,184,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8153/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,565,376,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8154/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,565,568,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8155/500000]
+ train/ActionL1Loss=0.0320
+ throughput/total_tokens=1,565,760,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8156/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,565,952,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8157/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,566,144,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8158/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,566,336,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8159/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,566,528,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8160/500000]
+ optim/total_grad_norm=8.542
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,566,720,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8161/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=1,566,912,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8162/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,567,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8163/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,567,296,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8164/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=1,567,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8165/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,567,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8166/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,567,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8167/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,568,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8168/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,568,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8169/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,568,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8170/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,568,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8171/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,568,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8172/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,569,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8173/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,569,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8174/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,569,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8175/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,569,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8176/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,569,792,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8177/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,569,984,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8178/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,570,176,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8179/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,570,368,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8180/500000]
+ optim/total_grad_norm=7.846
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,570,560,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8181/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,570,752,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8182/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,570,944,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8183/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,571,136,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8184/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,571,328,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8185/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,571,520,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8186/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,571,712,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8187/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,571,904,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8188/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,572,096,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8189/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,572,288,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8190/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,572,480,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8191/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,572,672,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8192/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,572,864,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8193/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,573,056,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8194/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,573,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8195/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,573,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8196/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,573,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8197/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,573,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8198/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,574,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8199/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,574,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8200/500000]
+ optim/total_grad_norm=6.720
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,574,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8201/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,574,592,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8202/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,574,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8203/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,574,976,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8204/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=1,575,168,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8205/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,575,360,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8206/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,575,552,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8207/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,575,744,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8208/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,575,936,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8209/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,576,128,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8210/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=1,576,320,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=8211/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=1,576,512,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8212/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,576,704,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8213/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,576,896,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8214/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,577,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8215/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,577,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8216/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,577,472,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8217/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,577,664,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8218/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,577,856,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8219/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,578,048,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8220/500000]
+ optim/total_grad_norm=7.127
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,578,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8221/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,578,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8222/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=1,578,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8223/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,578,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8224/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,579,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8225/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,579,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8226/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,579,392,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8227/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,579,584,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8228/500000]
+ train/ActionL1Loss=0.0329
+ throughput/total_tokens=1,579,776,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8229/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,579,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8230/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,580,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8231/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,580,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8232/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,580,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8233/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,580,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8234/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,580,928,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8235/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,581,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8236/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,581,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8237/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,581,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8238/500000]
+ train/ActionL1Loss=0.0346
+ throughput/total_tokens=1,581,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8239/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,581,888,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8240/500000]
+ optim/total_grad_norm=8.483
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,582,080,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8241/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,582,272,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8242/500000]
+ train/ActionL1Loss=0.0337
+ throughput/total_tokens=1,582,464,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8243/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,582,656,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8244/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,582,848,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8245/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,583,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8246/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,583,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8247/500000]
+ train/ActionL1Loss=0.0352
+ throughput/total_tokens=1,583,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8248/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=1,583,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8249/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,583,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8250/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,584,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8251/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,584,192,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8252/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,584,384,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8253/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,584,576,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8254/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,584,768,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8255/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,584,960,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8256/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,585,152,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8257/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,585,344,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8258/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,585,536,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8259/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,585,728,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8260/500000]
+ optim/total_grad_norm=7.384
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,585,920,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8261/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,586,112,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8262/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,586,304,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8263/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,586,496,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8264/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,586,688,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8265/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,586,880,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8266/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,587,072,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8267/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,587,264,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8268/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,587,456,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8269/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,587,648,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8270/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,587,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8271/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,588,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8272/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,588,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8273/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,588,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8274/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,588,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8275/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,588,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8276/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,588,992,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8277/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,589,184,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8278/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,589,376,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8279/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,589,568,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8280/500000]
+ optim/total_grad_norm=7.994
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,589,760,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8281/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,589,952,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8282/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,590,144,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8283/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,590,336,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8284/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,590,528,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8285/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,590,720,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8286/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,590,912,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8287/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,591,104,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8288/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,591,296,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8289/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,591,488,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8290/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,591,680,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8291/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,591,872,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8292/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,592,064,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8293/500000]
+ train/ActionL1Loss=0.0327
+ throughput/total_tokens=1,592,256,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8294/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,592,448,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8295/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,592,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8296/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,592,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8297/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,593,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8298/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,593,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8299/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,593,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8300/500000]
+ optim/total_grad_norm=8.975
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,593,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8301/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,593,792,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8302/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,593,984,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8303/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,594,176,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8304/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,594,368,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8305/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,594,560,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8306/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,594,752,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8307/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,594,944,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8308/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,595,136,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8309/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,595,328,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8310/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,595,520,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8311/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,595,712,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8312/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,595,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8313/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,596,096,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8314/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,596,288,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8315/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,596,480,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8316/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=1,596,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8317/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,596,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8318/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,597,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8319/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,597,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8320/500000]
+ optim/total_grad_norm=7.887
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,597,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8321/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,597,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8322/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,597,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8323/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,598,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8324/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=1,598,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8325/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,598,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8326/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,598,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8327/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,598,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8328/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,598,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8329/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,599,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8330/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,599,360,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8331/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,599,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8332/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,599,744,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8333/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,599,936,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8334/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,600,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8335/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,600,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8336/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,600,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8337/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,600,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8338/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,600,896,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8339/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,601,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8340/500000]
+ optim/total_grad_norm=5.843
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,601,280,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8341/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,601,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8342/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=1,601,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8343/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=1,601,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8344/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,602,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8345/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,602,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8346/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,602,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8347/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,602,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8348/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,602,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8349/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,603,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8350/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,603,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8351/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,603,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8352/500000]
+ train/ActionL1Loss=0.0324
+ throughput/total_tokens=1,603,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8353/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,603,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8354/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,603,968,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8355/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,604,160,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8356/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,604,352,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8357/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,604,544,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8358/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,604,736,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8359/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,604,928,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8360/500000]
+ optim/total_grad_norm=8.771
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,605,120,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8361/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,605,312,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8362/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,605,504,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8363/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=1,605,696,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8364/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,605,888,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8365/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,606,080,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8366/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,606,272,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8367/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,606,464,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8368/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,606,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8369/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,606,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8370/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,607,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8371/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,607,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8372/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,607,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8373/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,607,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8374/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,607,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8375/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,608,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8376/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,608,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8377/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,608,384,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8378/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,608,576,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8379/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,608,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8380/500000]
+ optim/total_grad_norm=8.711
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,608,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8381/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,609,152,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8382/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,609,344,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8383/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,609,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8384/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,609,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8385/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,609,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8386/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,610,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8387/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,610,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8388/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,610,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8389/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,610,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8390/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,610,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8391/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,611,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8392/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,611,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8393/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,611,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8394/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,611,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8395/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,611,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8396/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,612,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8397/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,612,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8398/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,612,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8399/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,612,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8400/500000]
+ optim/total_grad_norm=8.995
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,612,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8401/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,612,992,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8402/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,613,184,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8403/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=1,613,376,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8404/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,613,568,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8405/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,613,760,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8406/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,613,952,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8407/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,614,144,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8408/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,614,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8409/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,614,528,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8410/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,614,720,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=8411/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,614,912,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8412/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,615,104,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8413/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,615,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8414/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,615,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8415/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,615,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8416/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,615,872,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8417/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,616,064,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8418/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=1,616,256,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8419/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,616,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8420/500000]
+ optim/total_grad_norm=9.000
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=1,616,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8421/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,616,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8422/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,617,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8423/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,617,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8424/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,617,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8425/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,617,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8426/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,617,792,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8427/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,617,984,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8428/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,618,176,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8429/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,618,368,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8430/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,618,560,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8431/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,618,752,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8432/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,618,944,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8433/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,619,136,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8434/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,619,328,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8435/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,619,520,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8436/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,619,712,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8437/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,619,904,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8438/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,620,096,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8439/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,620,288,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8440/500000]
+ optim/total_grad_norm=7.173
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,620,480,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8441/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,620,672,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8442/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,620,864,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8443/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,621,056,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8444/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,621,248,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8445/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,621,440,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8446/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,621,632,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8447/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,621,824,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8448/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,622,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8449/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,622,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8450/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,622,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8451/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=1,622,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8452/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,622,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8453/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=1,622,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8454/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,623,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8455/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,623,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8456/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,623,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8457/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,623,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8458/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,623,936,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8459/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,624,128,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8460/500000]
+ optim/total_grad_norm=7.361
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,624,320,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=8461/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,624,512,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8462/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,624,704,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8463/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,624,896,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8464/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,625,088,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8465/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,625,280,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8466/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,625,472,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8467/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,625,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8468/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,625,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8469/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=1,626,048,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8470/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=1,626,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8471/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,626,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8472/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,626,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8473/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,626,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8474/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=1,627,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8475/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,627,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8476/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=1,627,392,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8477/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,627,584,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8478/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=1,627,776,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8479/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,627,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8480/500000]
+ optim/total_grad_norm=8.620
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,628,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8481/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,628,352,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8482/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,628,544,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8483/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,628,736,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8484/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,628,928,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8485/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,629,120,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8486/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,629,312,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8487/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,629,504,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8488/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,629,696,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8489/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,629,888,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8490/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,630,080,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8491/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,630,272,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8492/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,630,464,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8493/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,630,656,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8494/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,630,848,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8495/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=1,631,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8496/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,631,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8497/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,631,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8498/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,631,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8499/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,631,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8500/500000]
+ optim/total_grad_norm=5.791
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,632,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+10/04 [17:46:20] INFO | >> Saving config... checkpoint.py:608
+10/04 [17:46:57] INFO | >> Saving model state... checkpoint.py:796
+10/04 [17:48:06] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [17:49:38] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=8501/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,632,192,000
+ throughput/device/tokens_per_second=1,218
+ throughput/device/batches_per_second=0.0508
+[step=8502/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=1,632,384,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=8503/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,632,576,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8504/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,632,768,000
+ throughput/device/tokens_per_second=1,161
+ throughput/device/batches_per_second=0.0484
+[step=8505/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,632,960,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0486
+[step=8506/500000]
+ train/ActionL1Loss=0.0353
+ throughput/total_tokens=1,633,152,000
+ throughput/device/tokens_per_second=1,171
+ throughput/device/batches_per_second=0.0488
+[step=8507/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,633,344,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=8508/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,633,536,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=8509/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,633,728,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=8510/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,633,920,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+ System/Peak GPU Memory (MB)=46,917
+[step=8511/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,634,112,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=8512/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,634,304,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=8513/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,634,496,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=8514/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,634,688,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=8515/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=1,634,880,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=8516/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,635,072,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=8517/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,635,264,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=8518/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,635,456,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=8519/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,635,648,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8520/500000]
+ optim/total_grad_norm=8.249
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,635,840,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+ System/Peak GPU Memory (MB)=46,917
+[step=8521/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,636,032,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=8522/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,636,224,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8523/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,636,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8524/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,636,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8525/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,636,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8526/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,636,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8527/500000]
+ train/ActionL1Loss=0.0310
+ throughput/total_tokens=1,637,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8528/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,637,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8529/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,637,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8530/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,637,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8531/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=1,637,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8532/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,638,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8533/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,638,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8534/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,638,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8535/500000]
+ train/ActionL1Loss=0.0357
+ throughput/total_tokens=1,638,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8536/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,638,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8537/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,639,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8538/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,639,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8539/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,639,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8540/500000]
+ optim/total_grad_norm=7.448
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,639,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8541/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,639,872,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8542/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,640,064,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8543/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,640,256,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8544/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,640,448,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8545/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,640,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8546/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,640,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8547/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,641,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8548/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,641,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8549/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,641,408,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8550/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,641,600,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8551/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,641,792,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8552/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,641,984,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=8553/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,642,176,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=8554/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,642,368,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=8555/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=1,642,560,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=8556/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,642,752,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8557/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,642,944,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8558/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,643,136,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8559/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,643,328,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8560/500000]
+ optim/total_grad_norm=8.153
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,643,520,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=8561/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,643,712,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8562/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,643,904,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8563/500000]
+ train/ActionL1Loss=0.0313
+ throughput/total_tokens=1,644,096,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8564/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,644,288,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8565/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,644,480,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8566/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,644,672,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8567/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,644,864,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8568/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,645,056,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8569/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,645,248,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=8570/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=1,645,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8571/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,645,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8572/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,645,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8573/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,646,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8574/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,646,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8575/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,646,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8576/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,646,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8577/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,646,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8578/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,646,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8579/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,647,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8580/500000]
+ optim/total_grad_norm=7.720
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,647,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8581/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,647,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8582/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,647,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8583/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,647,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8584/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,648,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8585/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,648,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8586/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,648,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8587/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,648,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8588/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,648,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8589/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,649,088,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8590/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,649,280,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8591/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,649,472,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8592/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,649,664,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8593/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,649,856,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8594/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,650,048,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8595/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,650,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8596/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,650,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8597/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,650,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8598/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,650,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8599/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,651,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8600/500000]
+ optim/total_grad_norm=7.501
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,651,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8601/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,651,392,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8602/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,651,584,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8603/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,651,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8604/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,651,968,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8605/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,652,160,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8606/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,652,352,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8607/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,652,544,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8608/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,652,736,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8609/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,652,928,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8610/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,653,120,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8611/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,653,312,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8612/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,653,504,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8613/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,653,696,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8614/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,653,888,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8615/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=1,654,080,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8616/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,654,272,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8617/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,654,464,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8618/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,654,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8619/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,654,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8620/500000]
+ optim/total_grad_norm=8.494
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=1,655,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8621/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,655,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8622/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,655,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8623/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,655,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8624/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,655,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8625/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,656,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8626/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,656,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8627/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,656,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8628/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,656,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8629/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,656,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8630/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,656,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8631/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,657,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8632/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,657,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8633/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,657,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8634/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,657,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8635/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,657,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8636/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=1,658,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8637/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,658,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8638/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,658,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8639/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,658,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8640/500000]
+ optim/total_grad_norm=6.222
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,658,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8641/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,659,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8642/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,659,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8643/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,659,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8644/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,659,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8645/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,659,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8646/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,660,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8647/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,660,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8648/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,660,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8649/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,660,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8650/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,660,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8651/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,660,992,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8652/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,661,184,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8653/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,661,376,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8654/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,661,568,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8655/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,661,760,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8656/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,661,952,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8657/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,662,144,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8658/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,662,336,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8659/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,662,528,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8660/500000]
+ optim/total_grad_norm=9.053
+ train/ActionL1Loss=0.0325
+ throughput/total_tokens=1,662,720,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8661/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,662,912,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8662/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=1,663,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8663/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,663,296,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8664/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,663,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8665/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,663,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8666/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,663,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8667/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,664,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8668/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,664,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8669/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,664,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8670/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,664,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8671/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,664,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8672/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,665,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8673/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,665,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8674/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,665,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8675/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,665,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8676/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,665,792,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8677/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,665,984,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8678/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,666,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8679/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,666,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8680/500000]
+ optim/total_grad_norm=8.540
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,666,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8681/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,666,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8682/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,666,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8683/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,667,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8684/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,667,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8685/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,667,520,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8686/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,667,712,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8687/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=1,667,904,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8688/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,668,096,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8689/500000]
+ train/ActionL1Loss=0.0315
+ throughput/total_tokens=1,668,288,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8690/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,668,480,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8691/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,668,672,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8692/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,668,864,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8693/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,669,056,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8694/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,669,248,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8695/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,669,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8696/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,669,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8697/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,669,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8698/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,670,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8699/500000]
+ train/ActionL1Loss=0.0367
+ throughput/total_tokens=1,670,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8700/500000]
+ optim/total_grad_norm=7.712
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,670,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8701/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=1,670,592,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8702/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,670,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8703/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,670,976,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8704/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,671,168,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8705/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,671,360,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8706/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,671,552,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8707/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,671,744,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8708/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,671,936,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8709/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,672,128,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8710/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,672,320,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=8711/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=1,672,512,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8712/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,672,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8713/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,672,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8714/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,673,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8715/500000]
+ train/ActionL1Loss=0.0330
+ throughput/total_tokens=1,673,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8716/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,673,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8717/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,673,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8718/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,673,856,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8719/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,674,048,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8720/500000]
+ optim/total_grad_norm=7.103
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,674,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8721/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,674,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8722/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,674,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8723/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,674,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8724/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,675,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8725/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,675,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8726/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,675,392,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8727/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,675,584,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8728/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,675,776,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8729/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,675,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8730/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,676,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8731/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,676,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8732/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,676,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8733/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,676,736,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8734/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,676,928,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8735/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,677,120,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8736/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,677,312,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8737/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,677,504,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8738/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,677,696,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8739/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,677,888,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8740/500000]
+ optim/total_grad_norm=7.496
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,678,080,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8741/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,678,272,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8742/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,678,464,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8743/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,678,656,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8744/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,678,848,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8745/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=1,679,040,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8746/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=1,679,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8747/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,679,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8748/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=1,679,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8749/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,679,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8750/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,680,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8751/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,680,192,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8752/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,680,384,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8753/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,680,576,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8754/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,680,768,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8755/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,680,960,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8756/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,681,152,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8757/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,681,344,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8758/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,681,536,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8759/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,681,728,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8760/500000]
+ optim/total_grad_norm=10.26
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,681,920,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8761/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,682,112,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8762/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,682,304,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8763/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,682,496,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8764/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,682,688,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8765/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,682,880,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8766/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,683,072,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8767/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,683,264,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8768/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,683,456,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8769/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,683,648,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8770/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,683,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8771/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,684,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8772/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,684,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8773/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,684,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8774/500000]
+ train/ActionL1Loss=0.0287
+ throughput/total_tokens=1,684,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8775/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,684,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8776/500000]
+ train/ActionL1Loss=0.0387
+ throughput/total_tokens=1,684,992,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8777/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=1,685,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8778/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,685,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8779/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,685,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8780/500000]
+ optim/total_grad_norm=9.592
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,685,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8781/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,685,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8782/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,686,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8783/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,686,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8784/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,686,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8785/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,686,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8786/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,686,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8787/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=1,687,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8788/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,687,296,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8789/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,687,488,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8790/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,687,680,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8791/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,687,872,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8792/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,688,064,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8793/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,688,256,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8794/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,688,448,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8795/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,688,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8796/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,688,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8797/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,689,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8798/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,689,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8799/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=1,689,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8800/500000]
+ optim/total_grad_norm=8.397
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,689,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8801/500000]
+ train/ActionL1Loss=0.0343
+ throughput/total_tokens=1,689,792,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8802/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,689,984,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8803/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=1,690,176,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8804/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,690,368,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8805/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,690,560,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8806/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,690,752,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8807/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,690,944,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8808/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,691,136,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8809/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,691,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8810/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,691,520,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8811/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,691,712,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8812/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,691,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8813/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,692,096,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8814/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,692,288,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8815/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,692,480,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8816/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,692,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8817/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,692,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8818/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,693,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=8819/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,693,248,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8820/500000]
+ optim/total_grad_norm=6.360
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=1,693,440,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8821/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,693,632,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8822/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,693,824,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8823/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,694,016,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8824/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,694,208,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8825/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,694,400,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8826/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,694,592,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8827/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,694,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8828/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,694,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8829/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,695,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8830/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,695,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8831/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,695,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8832/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,695,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8833/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,695,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8834/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,696,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8835/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,696,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8836/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,696,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8837/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,696,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8838/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,696,896,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8839/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,697,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8840/500000]
+ optim/total_grad_norm=8.920
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,697,280,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8841/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,697,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8842/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,697,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8843/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,697,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8844/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,698,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8845/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,698,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8846/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,698,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8847/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,698,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8848/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,698,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8849/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,699,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8850/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,699,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8851/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,699,392,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8852/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,699,584,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8853/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,699,776,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8854/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,699,968,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8855/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,700,160,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=8856/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,700,352,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8857/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,700,544,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8858/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,700,736,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8859/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,700,928,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8860/500000]
+ optim/total_grad_norm=7.119
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,701,120,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=8861/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,701,312,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8862/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,701,504,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8863/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,701,696,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8864/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,701,888,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8865/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,702,080,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8866/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,702,272,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8867/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,702,464,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8868/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,702,656,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8869/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,702,848,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=8870/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,703,040,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8871/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,703,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8872/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,703,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8873/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,703,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8874/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,703,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8875/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,704,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8876/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,704,192,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8877/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=1,704,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8878/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,704,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8879/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,704,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8880/500000]
+ optim/total_grad_norm=6.962
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,704,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8881/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,705,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8882/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,705,344,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8883/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,705,536,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8884/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,705,728,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8885/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,705,920,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8886/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,706,112,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8887/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,706,304,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8888/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,706,496,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8889/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,706,688,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8890/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,706,880,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8891/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,707,072,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8892/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,707,264,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8893/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,707,456,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=8894/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,707,648,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8895/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,707,840,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8896/500000]
+ train/ActionL1Loss=0.0345
+ throughput/total_tokens=1,708,032,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8897/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,708,224,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8898/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,708,416,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8899/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,708,608,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8900/500000]
+ optim/total_grad_norm=7.136
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,708,800,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=8901/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,708,992,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8902/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,709,184,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8903/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,709,376,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8904/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,709,568,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8905/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,709,760,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8906/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,709,952,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8907/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,710,144,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8908/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,710,336,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8909/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,710,528,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8910/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,710,720,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=8911/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,710,912,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8912/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,711,104,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8913/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,711,296,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8914/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,711,488,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8915/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,711,680,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8916/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,711,872,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8917/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,712,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8918/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,712,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8919/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,712,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=8920/500000]
+ optim/total_grad_norm=8.578
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,712,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8921/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,712,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8922/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,713,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8923/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,713,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8924/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=1,713,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8925/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,713,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8926/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,713,792,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8927/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,713,984,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8928/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,714,176,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8929/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,714,368,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8930/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,714,560,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8931/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,714,752,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8932/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,714,944,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8933/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,715,136,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8934/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,715,328,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8935/500000]
+ train/ActionL1Loss=0.0366
+ throughput/total_tokens=1,715,520,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8936/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,715,712,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8937/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,715,904,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=8938/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,716,096,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=8939/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,716,288,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8940/500000]
+ optim/total_grad_norm=10.57
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,716,480,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=8941/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,716,672,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8942/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,716,864,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8943/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,717,056,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8944/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,717,248,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8945/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,717,440,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8946/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,717,632,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8947/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,717,824,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8948/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,718,016,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8949/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,718,208,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8950/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,718,400,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=8951/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,718,592,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8952/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,718,784,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8953/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,718,976,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8954/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,719,168,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8955/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=1,719,360,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8956/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=1,719,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8957/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,719,744,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8958/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,719,936,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8959/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,720,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8960/500000]
+ optim/total_grad_norm=7.981
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,720,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8961/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,720,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8962/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,720,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8963/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=1,720,896,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8964/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,721,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8965/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,721,280,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8966/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,721,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8967/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,721,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8968/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,721,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=8969/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,722,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=8970/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,722,240,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=8971/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,722,432,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8972/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,722,624,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8973/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,722,816,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8974/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,723,008,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=8975/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,723,200,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=8976/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,723,392,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8977/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,723,584,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8978/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,723,776,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8979/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,723,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8980/500000]
+ optim/total_grad_norm=9.302
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,724,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8981/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,724,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8982/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,724,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8983/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,724,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8984/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,724,928,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8985/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,725,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8986/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,725,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8987/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,725,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8988/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,725,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8989/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,725,888,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8990/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,726,080,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=8991/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,726,272,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=8992/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,726,464,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8993/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,726,656,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8994/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,726,848,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8995/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,727,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8996/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=1,727,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8997/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,727,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8998/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,727,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=8999/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=1,727,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9000/500000]
+ optim/total_grad_norm=9.112
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,728,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+10/04 [20:39:38] INFO | >> Saving config... checkpoint.py:608
+10/04 [20:40:22] INFO | >> Saving model state... checkpoint.py:796
+10/04 [20:41:40] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [20:43:12] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=9001/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,728,192,000
+ throughput/device/tokens_per_second=1,215
+ throughput/device/batches_per_second=0.0506
+[step=9002/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,728,384,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9003/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,728,576,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9004/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,728,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9005/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,728,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9006/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,729,152,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9007/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,729,344,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9008/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,729,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9009/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,729,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9010/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,729,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9011/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,730,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9012/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=1,730,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9013/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,730,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9014/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,730,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9015/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,730,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9016/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,731,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9017/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,731,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9018/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,731,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9019/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,731,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9020/500000]
+ optim/total_grad_norm=7.431
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,731,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9021/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,732,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9022/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,732,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9023/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,732,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9024/500000]
+ train/ActionL1Loss=0.0351
+ throughput/total_tokens=1,732,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9025/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,732,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9026/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,732,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9027/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,733,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9028/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,733,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9029/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,733,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9030/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=1,733,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9031/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,733,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9032/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,734,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9033/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,734,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9034/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,734,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9035/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,734,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9036/500000]
+ train/ActionL1Loss=0.0318
+ throughput/total_tokens=1,734,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9037/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,735,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9038/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,735,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9039/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,735,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9040/500000]
+ optim/total_grad_norm=8.617
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=1,735,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9041/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,735,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9042/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,736,064,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9043/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,736,256,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9044/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,736,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9045/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,736,640,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9046/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,736,832,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9047/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,737,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9048/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=1,737,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9049/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=1,737,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9050/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,737,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9051/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,737,792,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9052/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,737,984,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9053/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,738,176,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9054/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,738,368,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9055/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,738,560,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9056/500000]
+ train/ActionL1Loss=0.0348
+ throughput/total_tokens=1,738,752,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9057/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,738,944,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9058/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,739,136,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9059/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,739,328,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9060/500000]
+ optim/total_grad_norm=9.046
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,739,520,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=9061/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,739,712,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9062/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,739,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9063/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,740,096,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9064/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,740,288,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9065/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,740,480,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9066/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,740,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9067/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,740,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9068/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,741,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9069/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,741,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9070/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,741,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9071/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,741,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9072/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,741,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9073/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,742,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9074/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,742,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9075/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,742,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9076/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,742,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9077/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,742,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9078/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,742,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9079/500000]
+ train/ActionL1Loss=0.0158
+ throughput/total_tokens=1,743,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9080/500000]
+ optim/total_grad_norm=9.055
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,743,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9081/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,743,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9082/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,743,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9083/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,743,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9084/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=1,744,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9085/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,744,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9086/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,744,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9087/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,744,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9088/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,744,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9089/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,745,088,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9090/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,745,280,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9091/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,745,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9092/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,745,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9093/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=1,745,856,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9094/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,746,048,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9095/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,746,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9096/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,746,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9097/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,746,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9098/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,746,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9099/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,747,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9100/500000]
+ optim/total_grad_norm=8.474
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,747,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9101/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,747,392,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9102/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,747,584,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9103/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,747,776,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9104/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,747,968,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9105/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,748,160,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9106/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,748,352,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9107/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,748,544,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9108/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,748,736,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9109/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,748,928,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9110/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,749,120,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=9111/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,749,312,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9112/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,749,504,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9113/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,749,696,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9114/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,749,888,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9115/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,750,080,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9116/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,750,272,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9117/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,750,464,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9118/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,750,656,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9119/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,750,848,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9120/500000]
+ optim/total_grad_norm=7.706
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=1,751,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9121/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,751,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9122/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,751,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9123/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,751,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9124/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,751,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9125/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,752,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9126/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,752,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9127/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,752,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9128/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=1,752,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9129/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,752,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9130/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,752,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9131/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,753,152,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9132/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,753,344,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9133/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,753,536,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9134/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,753,728,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9135/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,753,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9136/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,754,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9137/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,754,304,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9138/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,754,496,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9139/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,754,688,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9140/500000]
+ optim/total_grad_norm=7.036
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,754,880,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9141/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,755,072,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9142/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,755,264,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9143/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,755,456,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9144/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,755,648,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9145/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,755,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9146/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,756,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9147/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,756,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9148/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,756,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9149/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,756,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9150/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,756,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9151/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,756,992,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9152/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,757,184,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9153/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,757,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9154/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,757,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9155/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,757,760,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9156/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=1,757,952,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9157/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,758,144,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9158/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,758,336,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9159/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,758,528,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9160/500000]
+ optim/total_grad_norm=8.619
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,758,720,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9161/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,758,912,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9162/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=1,759,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9163/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,759,296,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9164/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,759,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9165/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,759,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9166/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,759,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9167/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,760,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9168/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,760,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9169/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=1,760,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9170/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,760,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9171/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=1,760,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9172/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,761,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9173/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,761,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9174/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,761,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9175/500000]
+ train/ActionL1Loss=0.0334
+ throughput/total_tokens=1,761,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9176/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,761,792,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9177/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,761,984,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9178/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,762,176,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9179/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=1,762,368,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9180/500000]
+ optim/total_grad_norm=8.387
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,762,560,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9181/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,762,752,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9182/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,762,944,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9183/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,763,136,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9184/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,763,328,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9185/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,763,520,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9186/500000]
+ train/ActionL1Loss=0.0335
+ throughput/total_tokens=1,763,712,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9187/500000]
+ train/ActionL1Loss=0.0328
+ throughput/total_tokens=1,763,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9188/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,764,096,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9189/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,764,288,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9190/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,764,480,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9191/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,764,672,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9192/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,764,864,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9193/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,765,056,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9194/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,765,248,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9195/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,765,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9196/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,765,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9197/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,765,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9198/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,766,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9199/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,766,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9200/500000]
+ optim/total_grad_norm=6.936
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,766,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9201/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,766,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9202/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,766,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9203/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=1,766,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9204/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=1,767,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9205/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,767,360,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9206/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,767,552,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9207/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,767,744,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9208/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,767,936,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9209/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,768,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9210/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,768,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9211/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,768,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9212/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,768,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9213/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,768,896,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9214/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,769,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9215/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,769,280,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9216/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,769,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9217/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,769,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9218/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,769,856,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9219/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=1,770,048,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9220/500000]
+ optim/total_grad_norm=6.709
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,770,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9221/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,770,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9222/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,770,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9223/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,770,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9224/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,771,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9225/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=1,771,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9226/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,771,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9227/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,771,584,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9228/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,771,776,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9229/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,771,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9230/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,772,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9231/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,772,352,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9232/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,772,544,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9233/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=1,772,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9234/500000]
+ train/ActionL1Loss=0.0309
+ throughput/total_tokens=1,772,928,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9235/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=1,773,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9236/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=1,773,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9237/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,773,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9238/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,773,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9239/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,773,888,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9240/500000]
+ optim/total_grad_norm=8.225
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,774,080,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9241/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,774,272,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9242/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=1,774,464,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=9243/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,774,656,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=9244/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,774,848,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=9245/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,775,040,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=9246/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,775,232,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=9247/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,775,424,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=9248/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,775,616,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=9249/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,775,808,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=9250/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,776,000,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=9251/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,776,192,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9252/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,776,384,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9253/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,776,576,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9254/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,776,768,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9255/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,776,960,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9256/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,777,152,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9257/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,777,344,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9258/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,777,536,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9259/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,777,728,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9260/500000]
+ optim/total_grad_norm=8.772
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=1,777,920,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9261/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,778,112,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9262/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,778,304,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9263/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,778,496,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9264/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,778,688,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9265/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,778,880,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9266/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,779,072,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9267/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=1,779,264,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9268/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,779,456,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9269/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,779,648,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9270/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,779,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9271/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,780,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9272/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,780,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9273/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=1,780,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9274/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,780,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9275/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,780,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9276/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,780,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9277/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,781,184,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9278/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,781,376,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9279/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,781,568,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9280/500000]
+ optim/total_grad_norm=6.670
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,781,760,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9281/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=1,781,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9282/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,782,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9283/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,782,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9284/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=1,782,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9285/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,782,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9286/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,782,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9287/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,783,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9288/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=1,783,296,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9289/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,783,488,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9290/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=1,783,680,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9291/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=1,783,872,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9292/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,784,064,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9293/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,784,256,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9294/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,784,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9295/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,784,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9296/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,784,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9297/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,785,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9298/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,785,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9299/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,785,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9300/500000]
+ optim/total_grad_norm=8.748
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,785,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9301/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,785,792,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9302/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,785,984,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9303/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,786,176,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9304/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,786,368,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9305/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,786,560,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9306/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,786,752,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9307/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,786,944,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9308/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,787,136,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9309/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,787,328,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9310/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,787,520,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9311/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,787,712,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9312/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,787,904,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9313/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,788,096,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9314/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,788,288,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9315/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,788,480,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9316/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,788,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9317/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,788,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9318/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,789,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9319/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=1,789,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9320/500000]
+ optim/total_grad_norm=5.708
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,789,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9321/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=1,789,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9322/500000]
+ train/ActionL1Loss=0.0312
+ throughput/total_tokens=1,789,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9323/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,790,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9324/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=1,790,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9325/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,790,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9326/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,790,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9327/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,790,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9328/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,790,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9329/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,791,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9330/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,791,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9331/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,791,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9332/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,791,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9333/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,791,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9334/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,792,128,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9335/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=1,792,320,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9336/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=1,792,512,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9337/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,792,704,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9338/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,792,896,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9339/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,793,088,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9340/500000]
+ optim/total_grad_norm=9.806
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,793,280,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9341/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=1,793,472,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9342/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,793,664,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9343/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,793,856,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9344/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,794,048,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9345/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=1,794,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9346/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,794,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9347/500000]
+ train/ActionL1Loss=0.0344
+ throughput/total_tokens=1,794,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9348/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,794,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9349/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=1,795,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9350/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,795,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9351/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,795,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9352/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,795,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9353/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,795,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9354/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,795,968,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9355/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,796,160,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9356/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,796,352,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9357/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,796,544,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9358/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,796,736,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9359/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,796,928,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9360/500000]
+ optim/total_grad_norm=9.723
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,797,120,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9361/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,797,312,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9362/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,797,504,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9363/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,797,696,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9364/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,797,888,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9365/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,798,080,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9366/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=1,798,272,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9367/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=1,798,464,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9368/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,798,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9369/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,798,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9370/500000]
+ train/ActionL1Loss=0.0154
+ throughput/total_tokens=1,799,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9371/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,799,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9372/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,799,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9373/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,799,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9374/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,799,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9375/500000]
+ train/ActionL1Loss=0.0155
+ throughput/total_tokens=1,800,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9376/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=1,800,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9377/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,800,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9378/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,800,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9379/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,800,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9380/500000]
+ optim/total_grad_norm=7.990
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,800,960,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9381/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=1,801,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9382/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,801,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9383/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,801,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9384/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,801,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9385/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,801,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9386/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,802,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9387/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,802,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9388/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,802,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9389/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,802,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9390/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,802,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9391/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,803,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9392/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,803,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9393/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,803,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9394/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,803,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9395/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,803,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9396/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,804,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9397/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,804,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9398/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,804,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9399/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,804,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9400/500000]
+ optim/total_grad_norm=7.917
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,804,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9401/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,804,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9402/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,805,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9403/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,805,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9404/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,805,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9405/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,805,760,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9406/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,805,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9407/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,806,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9408/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=1,806,336,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9409/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,806,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9410/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,806,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9411/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,806,912,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9412/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,807,104,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9413/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,807,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9414/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,807,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9415/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,807,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9416/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,807,872,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9417/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,808,064,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9418/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,808,256,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9419/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,808,448,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9420/500000]
+ optim/total_grad_norm=9.348
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,808,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9421/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,808,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9422/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,809,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9423/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,809,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9424/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=1,809,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9425/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,809,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9426/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,809,792,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9427/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,809,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9428/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,810,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9429/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,810,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9430/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,810,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9431/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,810,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9432/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,810,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9433/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,811,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9434/500000]
+ train/ActionL1Loss=0.0331
+ throughput/total_tokens=1,811,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9435/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=1,811,520,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9436/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,811,712,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9437/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,811,904,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9438/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,812,096,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9439/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,812,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9440/500000]
+ optim/total_grad_norm=7.894
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,812,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9441/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,812,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9442/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=1,812,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9443/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,813,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9444/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,813,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9445/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,813,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9446/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,813,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9447/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,813,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9448/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,814,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9449/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,814,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9450/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,814,400,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9451/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,814,592,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9452/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=1,814,784,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9453/500000]
+ train/ActionL1Loss=0.0301
+ throughput/total_tokens=1,814,976,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9454/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,815,168,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9455/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,815,360,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9456/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,815,552,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9457/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,815,744,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9458/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=1,815,936,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9459/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,816,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9460/500000]
+ optim/total_grad_norm=7.768
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,816,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9461/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,816,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9462/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,816,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9463/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,816,896,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9464/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,817,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9465/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,817,280,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9466/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,817,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9467/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,817,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9468/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,817,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9469/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=1,818,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9470/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,818,240,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9471/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,818,432,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=9472/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,818,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9473/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,818,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9474/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,819,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9475/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,819,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9476/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,819,392,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9477/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,819,584,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9478/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,819,776,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9479/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,819,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9480/500000]
+ optim/total_grad_norm=8.862
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,820,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9481/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,820,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9482/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,820,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9483/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,820,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9484/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,820,928,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9485/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,821,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9486/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,821,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9487/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=1,821,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9488/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,821,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9489/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=1,821,888,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9490/500000]
+ train/ActionL1Loss=0.0151
+ throughput/total_tokens=1,822,080,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9491/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=1,822,272,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9492/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,822,464,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9493/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,822,656,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9494/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,822,848,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9495/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,823,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9496/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,823,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9497/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,823,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9498/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,823,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9499/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=1,823,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9500/500000]
+ optim/total_grad_norm=7.765
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,824,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+10/04 [23:33:20] INFO | >> Saving config... checkpoint.py:608
+10/04 [23:33:58] INFO | >> Saving model state... checkpoint.py:796
+10/04 [23:35:08] INFO | >> Saving optim state... checkpoint.py:811
+10/04 [23:36:41] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=9501/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=1,824,192,000
+ throughput/device/tokens_per_second=1,224
+ throughput/device/batches_per_second=0.0510
+[step=9502/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,824,384,000
+ throughput/device/tokens_per_second=1,198
+ throughput/device/batches_per_second=0.0499
+[step=9503/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,824,576,000
+ throughput/device/tokens_per_second=1,194
+ throughput/device/batches_per_second=0.0498
+[step=9504/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=1,824,768,000
+ throughput/device/tokens_per_second=1,192
+ throughput/device/batches_per_second=0.0497
+[step=9505/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,824,960,000
+ throughput/device/tokens_per_second=1,191
+ throughput/device/batches_per_second=0.0497
+[step=9506/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=1,825,152,000
+ throughput/device/tokens_per_second=1,191
+ throughput/device/batches_per_second=0.0496
+[step=9507/500000]
+ train/ActionL1Loss=0.0333
+ throughput/total_tokens=1,825,344,000
+ throughput/device/tokens_per_second=1,190
+ throughput/device/batches_per_second=0.0496
+[step=9508/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,825,536,000
+ throughput/device/tokens_per_second=1,190
+ throughput/device/batches_per_second=0.0496
+[step=9509/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=1,825,728,000
+ throughput/device/tokens_per_second=1,190
+ throughput/device/batches_per_second=0.0496
+[step=9510/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=1,825,920,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=9511/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,826,112,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=9512/500000]
+ train/ActionL1Loss=0.0149
+ throughput/total_tokens=1,826,304,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=9513/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,826,496,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=9514/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,826,688,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9515/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,826,880,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9516/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,827,072,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9517/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,827,264,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9518/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=1,827,456,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9519/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,827,648,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9520/500000]
+ optim/total_grad_norm=6.293
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,827,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9521/500000]
+ train/ActionL1Loss=0.0150
+ throughput/total_tokens=1,828,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9522/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,828,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9523/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,828,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9524/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,828,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9525/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,828,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9526/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,828,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9527/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,829,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9528/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,829,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9529/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,829,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9530/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=1,829,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9531/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,829,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9532/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,830,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9533/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,830,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9534/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=1,830,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9535/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=1,830,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9536/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,830,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9537/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,831,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9538/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,831,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9539/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,831,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9540/500000]
+ optim/total_grad_norm=6.744
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,831,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9541/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,831,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9542/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,832,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9543/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,832,256,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9544/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,832,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9545/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=1,832,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9546/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,832,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9547/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,833,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9548/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,833,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9549/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,833,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9550/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,833,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9551/500000]
+ train/ActionL1Loss=0.0155
+ throughput/total_tokens=1,833,792,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9552/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,833,984,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9553/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=1,834,176,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9554/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,834,368,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9555/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,834,560,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9556/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,834,752,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9557/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,834,944,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9558/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,835,136,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9559/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,835,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9560/500000]
+ optim/total_grad_norm=7.297
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,835,520,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9561/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,835,712,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9562/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,835,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9563/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,836,096,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9564/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,836,288,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9565/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,836,480,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9566/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,836,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9567/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=1,836,864,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9568/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,837,056,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9569/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,837,248,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9570/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,837,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9571/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,837,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9572/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,837,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9573/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,838,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9574/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,838,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9575/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,838,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9576/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,838,592,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9577/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,838,784,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9578/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,838,976,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9579/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,839,168,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9580/500000]
+ optim/total_grad_norm=8.697
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,839,360,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9581/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,839,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9582/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,839,744,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9583/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,839,936,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9584/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=1,840,128,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9585/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,840,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9586/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=1,840,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9587/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,840,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9588/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,840,896,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9589/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=1,841,088,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9590/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,841,280,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9591/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,841,472,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9592/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,841,664,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9593/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,841,856,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9594/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,842,048,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9595/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,842,240,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9596/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,842,432,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9597/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,842,624,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9598/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,842,816,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9599/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,843,008,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9600/500000]
+ optim/total_grad_norm=7.872
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=1,843,200,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9601/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,843,392,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=9602/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,843,584,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9603/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=1,843,776,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9604/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,843,968,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9605/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=1,844,160,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9606/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,844,352,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9607/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,844,544,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9608/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,844,736,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9609/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,844,928,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9610/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,845,120,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=9611/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,845,312,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9612/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,845,504,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9613/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,845,696,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9614/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,845,888,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9615/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,846,080,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9616/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,846,272,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9617/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=1,846,464,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9618/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,846,656,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9619/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,846,848,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9620/500000]
+ optim/total_grad_norm=9.186
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,847,040,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9621/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,847,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9622/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=1,847,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9623/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=1,847,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9624/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,847,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9625/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,848,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9626/500000]
+ train/ActionL1Loss=0.0308
+ throughput/total_tokens=1,848,192,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9627/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,848,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9628/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,848,576,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9629/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,848,768,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9630/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,848,960,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9631/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,849,152,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9632/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,849,344,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9633/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,849,536,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9634/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,849,728,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9635/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,849,920,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9636/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,850,112,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9637/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=1,850,304,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9638/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,850,496,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9639/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,850,688,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9640/500000]
+ optim/total_grad_norm=6.414
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=1,850,880,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9641/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,851,072,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9642/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,851,264,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9643/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,851,456,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9644/500000]
+ train/ActionL1Loss=0.0290
+ throughput/total_tokens=1,851,648,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9645/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,851,840,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9646/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,852,032,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9647/500000]
+ train/ActionL1Loss=0.0283
+ throughput/total_tokens=1,852,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9648/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,852,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9649/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,852,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9650/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,852,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9651/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=1,852,992,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=9652/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,853,184,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=9653/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,853,376,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=9654/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,853,568,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=9655/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,853,760,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=9656/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,853,952,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=9657/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,854,144,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=9658/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,854,336,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=9659/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=1,854,528,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=9660/500000]
+ optim/total_grad_norm=6.676
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,854,720,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+ System/Peak GPU Memory (MB)=46,917
+[step=9661/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,854,912,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=9662/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,855,104,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=9663/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,855,296,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=9664/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=1,855,488,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=9665/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,855,680,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=9666/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,855,872,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=9667/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,856,064,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=9668/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,856,256,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=9669/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,856,448,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=9670/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=1,856,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9671/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,856,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9672/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,857,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9673/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,857,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9674/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=1,857,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9675/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,857,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9676/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,857,792,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9677/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,857,984,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9678/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,858,176,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9679/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,858,368,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9680/500000]
+ optim/total_grad_norm=8.892
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,858,560,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9681/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,858,752,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9682/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,858,944,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9683/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,859,136,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9684/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,859,328,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9685/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,859,520,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9686/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,859,712,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9687/500000]
+ train/ActionL1Loss=0.0154
+ throughput/total_tokens=1,859,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9688/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,860,096,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9689/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=1,860,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9690/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,860,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9691/500000]
+ train/ActionL1Loss=0.0156
+ throughput/total_tokens=1,860,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9692/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,860,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9693/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,861,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9694/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=1,861,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9695/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,861,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9696/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,861,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9697/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=1,861,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9698/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,862,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9699/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,862,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9700/500000]
+ optim/total_grad_norm=8.757
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,862,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9701/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,862,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9702/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,862,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9703/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,862,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9704/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,863,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9705/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,863,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9706/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,863,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9707/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,863,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9708/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,863,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9709/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,864,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9710/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,864,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=9711/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,864,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9712/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,864,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9713/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,864,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9714/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,865,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9715/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,865,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9716/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,865,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9717/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,865,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9718/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,865,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9719/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=1,866,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9720/500000]
+ optim/total_grad_norm=6.600
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,866,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9721/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,866,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9722/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,866,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9723/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,866,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9724/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,867,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9725/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,867,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9726/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=1,867,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9727/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,867,584,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9728/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,867,776,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9729/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,867,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9730/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=1,868,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9731/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=1,868,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9732/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=1,868,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9733/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,868,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9734/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,868,928,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9735/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,869,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9736/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,869,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9737/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,869,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9738/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,869,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9739/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,869,888,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9740/500000]
+ optim/total_grad_norm=8.361
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=1,870,080,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9741/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,870,272,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9742/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,870,464,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9743/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,870,656,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9744/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,870,848,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9745/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,871,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9746/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=1,871,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9747/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,871,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9748/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,871,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9749/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,871,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9750/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,872,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9751/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,872,192,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9752/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,872,384,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9753/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,872,576,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9754/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,872,768,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9755/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,872,960,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9756/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,873,152,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9757/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,873,344,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9758/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,873,536,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9759/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,873,728,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9760/500000]
+ optim/total_grad_norm=8.431
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=1,873,920,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=9761/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,874,112,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9762/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,874,304,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9763/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,874,496,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9764/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,874,688,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9765/500000]
+ train/ActionL1Loss=0.0163
+ throughput/total_tokens=1,874,880,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9766/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=1,875,072,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9767/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,875,264,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9768/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,875,456,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9769/500000]
+ train/ActionL1Loss=0.0158
+ throughput/total_tokens=1,875,648,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9770/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,875,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9771/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,876,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9772/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=1,876,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9773/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,876,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9774/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,876,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9775/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,876,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9776/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=1,876,992,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9777/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,877,184,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9778/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=1,877,376,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9779/500000]
+ train/ActionL1Loss=0.0277
+ throughput/total_tokens=1,877,568,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9780/500000]
+ optim/total_grad_norm=8.137
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,877,760,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9781/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,877,952,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9782/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=1,878,144,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9783/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,878,336,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9784/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,878,528,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9785/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,878,720,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9786/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,878,912,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9787/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,879,104,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9788/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,879,296,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9789/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,879,488,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9790/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=1,879,680,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9791/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,879,872,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9792/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,880,064,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9793/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,880,256,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9794/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,880,448,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9795/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=1,880,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9796/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,880,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=9797/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,881,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9798/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,881,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9799/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=1,881,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9800/500000]
+ optim/total_grad_norm=8.607
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,881,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9801/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,881,792,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9802/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,881,984,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9803/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=1,882,176,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9804/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,882,368,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9805/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,882,560,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9806/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,882,752,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9807/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,882,944,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9808/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,883,136,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9809/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,883,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9810/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,883,520,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=9811/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,883,712,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9812/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=1,883,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9813/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,884,096,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9814/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,884,288,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9815/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,884,480,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9816/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=1,884,672,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9817/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=1,884,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9818/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,885,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9819/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,885,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9820/500000]
+ optim/total_grad_norm=7.490
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,885,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9821/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,885,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9822/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,885,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9823/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=1,886,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9824/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,886,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9825/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,886,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9826/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,886,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9827/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,886,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9828/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=1,886,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9829/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,887,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9830/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=1,887,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9831/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,887,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9832/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=1,887,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9833/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=1,887,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9834/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,888,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9835/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,888,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=9836/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=1,888,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9837/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,888,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9838/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=1,888,896,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9839/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,889,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9840/500000]
+ optim/total_grad_norm=9.024
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=1,889,280,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9841/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=1,889,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9842/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,889,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9843/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,889,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9844/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=1,890,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9845/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=1,890,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9846/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=1,890,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9847/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,890,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9848/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,890,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9849/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=1,891,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9850/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=1,891,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9851/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,891,392,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9852/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,891,584,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9853/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,891,776,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9854/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=1,891,968,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9855/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,892,160,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9856/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,892,352,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9857/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=1,892,544,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9858/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,892,736,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9859/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=1,892,928,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9860/500000]
+ optim/total_grad_norm=8.500
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,893,120,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9861/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,893,312,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9862/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,893,504,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9863/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,893,696,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9864/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,893,888,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9865/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,894,080,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9866/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,894,272,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9867/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=1,894,464,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9868/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,894,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9869/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,894,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9870/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,895,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9871/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,895,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9872/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=1,895,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9873/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,895,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9874/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,895,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9875/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,896,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9876/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,896,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9877/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,896,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9878/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,896,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9879/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=1,896,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9880/500000]
+ optim/total_grad_norm=8.926
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,896,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9881/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,897,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9882/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,897,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9883/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,897,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9884/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,897,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9885/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,897,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9886/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,898,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9887/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,898,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9888/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,898,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9889/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,898,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9890/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,898,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9891/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=1,899,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9892/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,899,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9893/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=1,899,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9894/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,899,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9895/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=1,899,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9896/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,900,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9897/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,900,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9898/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,900,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9899/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=1,900,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9900/500000]
+ optim/total_grad_norm=9.825
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,900,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9901/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,900,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9902/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,901,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9903/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,901,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9904/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=1,901,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9905/500000]
+ train/ActionL1Loss=0.0163
+ throughput/total_tokens=1,901,760,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9906/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,901,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9907/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,902,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9908/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,902,336,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9909/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,902,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9910/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=1,902,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9911/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,902,912,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9912/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=1,903,104,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9913/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,903,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9914/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,903,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9915/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,903,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9916/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,903,872,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9917/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=1,904,064,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9918/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,904,256,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9919/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,904,448,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=9920/500000]
+ optim/total_grad_norm=7.618
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=1,904,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9921/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=1,904,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9922/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,905,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9923/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=1,905,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9924/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,905,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9925/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=1,905,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9926/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,905,792,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9927/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,905,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9928/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,906,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9929/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,906,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9930/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,906,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9931/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=1,906,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9932/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,906,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9933/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,907,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9934/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=1,907,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9935/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=1,907,520,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9936/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,907,712,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9937/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,907,904,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9938/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,908,096,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9939/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,908,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9940/500000]
+ optim/total_grad_norm=8.257
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,908,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9941/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,908,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9942/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=1,908,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9943/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,909,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9944/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,909,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9945/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,909,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9946/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,909,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9947/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,909,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9948/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,910,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9949/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,910,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9950/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=1,910,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9951/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=1,910,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9952/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=1,910,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9953/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=1,910,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9954/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,911,168,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9955/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,911,360,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9956/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,911,552,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9957/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,911,744,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9958/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=1,911,936,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9959/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,912,128,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9960/500000]
+ optim/total_grad_norm=7.100
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,912,320,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=9961/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,912,512,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9962/500000]
+ train/ActionL1Loss=0.0303
+ throughput/total_tokens=1,912,704,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9963/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,912,896,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9964/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=1,913,088,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9965/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,913,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9966/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,913,472,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=9967/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=1,913,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9968/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,913,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9969/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,914,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=9970/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,914,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9971/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,914,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9972/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=1,914,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9973/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,914,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9974/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,915,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9975/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,915,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9976/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,915,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9977/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,915,584,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9978/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,915,776,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9979/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,915,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9980/500000]
+ optim/total_grad_norm=7.332
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,916,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=9981/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,916,352,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9982/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,916,544,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=9983/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,916,736,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9984/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,916,928,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9985/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,917,120,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9986/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,917,312,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9987/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,917,504,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9988/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,917,696,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9989/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=1,917,888,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9990/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,918,080,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=9991/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=1,918,272,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9992/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,918,464,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9993/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,918,656,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9994/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,918,848,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9995/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,919,040,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9996/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,919,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=9997/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=1,919,424,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9998/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=1,919,616,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=9999/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,919,808,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10000/500000]
+ optim/total_grad_norm=9.298
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,920,000,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+10/05 [02:27:01] INFO | >> Saving config... checkpoint.py:608
+10/05 [02:27:44] INFO | >> Saving model state... checkpoint.py:796
+10/05 [02:28:55] INFO | >> Saving optim state... checkpoint.py:811
+10/05 [02:30:26] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=10001/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=1,920,192,000
+ throughput/device/tokens_per_second=1,224
+ throughput/device/batches_per_second=0.0510
+[step=10002/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,920,384,000
+ throughput/device/tokens_per_second=1,203
+ throughput/device/batches_per_second=0.0501
+[step=10003/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,920,576,000
+ throughput/device/tokens_per_second=1,192
+ throughput/device/batches_per_second=0.0497
+[step=10004/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,920,768,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10005/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,920,960,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10006/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,921,152,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10007/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,921,344,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10008/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=1,921,536,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10009/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=1,921,728,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10010/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=1,921,920,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10011/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,922,112,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10012/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=1,922,304,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10013/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=1,922,496,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10014/500000]
+ train/ActionL1Loss=0.0160
+ throughput/total_tokens=1,922,688,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10015/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,922,880,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10016/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,923,072,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10017/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,923,264,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10018/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,923,456,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10019/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=1,923,648,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10020/500000]
+ optim/total_grad_norm=7.613
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,923,840,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10021/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,924,032,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10022/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=1,924,224,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10023/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=1,924,416,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10024/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=1,924,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10025/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=1,924,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10026/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,924,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10027/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=1,925,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10028/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,925,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10029/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=1,925,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10030/500000]
+ train/ActionL1Loss=0.0152
+ throughput/total_tokens=1,925,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10031/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=1,925,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10032/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,926,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10033/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,926,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10034/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=1,926,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10035/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=1,926,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10036/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=1,926,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10037/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,927,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10038/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,927,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10039/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,927,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10040/500000]
+ optim/total_grad_norm=6.874
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,927,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10041/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,927,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10042/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,928,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10043/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,928,256,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10044/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,928,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10045/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,928,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10046/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,928,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10047/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,929,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10048/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,929,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10049/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,929,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10050/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,929,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10051/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=1,929,792,000
+ throughput/device/tokens_per_second=1,174
+ throughput/device/batches_per_second=0.0489
+[step=10052/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,929,984,000
+ throughput/device/tokens_per_second=1,174
+ throughput/device/batches_per_second=0.0489
+[step=10053/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,930,176,000
+ throughput/device/tokens_per_second=1,174
+ throughput/device/batches_per_second=0.0489
+[step=10054/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,930,368,000
+ throughput/device/tokens_per_second=1,174
+ throughput/device/batches_per_second=0.0489
+[step=10055/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,930,560,000
+ throughput/device/tokens_per_second=1,174
+ throughput/device/batches_per_second=0.0490
+[step=10056/500000]
+ train/ActionL1Loss=0.0279
+ throughput/total_tokens=1,930,752,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=10057/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,930,944,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=10058/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=1,931,136,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=10059/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=1,931,328,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=10060/500000]
+ optim/total_grad_norm=8.851
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,931,520,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+ System/Peak GPU Memory (MB)=46,917
+[step=10061/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,931,712,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=10062/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,931,904,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=10063/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,932,096,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=10064/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,932,288,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=10065/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,932,480,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=10066/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=1,932,672,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=10067/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,932,864,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=10068/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=1,933,056,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=10069/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,933,248,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=10070/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,933,440,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=10071/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,933,632,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10072/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,933,824,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10073/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,934,016,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10074/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,934,208,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10075/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,934,400,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10076/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,934,592,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10077/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,934,784,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10078/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,934,976,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10079/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,935,168,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10080/500000]
+ optim/total_grad_norm=8.060
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=1,935,360,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10081/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,935,552,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10082/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,935,744,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10083/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,935,936,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10084/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,936,128,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10085/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,936,320,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10086/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=1,936,512,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10087/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,936,704,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10088/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=1,936,896,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10089/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,937,088,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10090/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,937,280,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10091/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=1,937,472,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10092/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,937,664,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10093/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,937,856,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10094/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=1,938,048,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10095/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,938,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10096/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,938,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10097/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,938,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10098/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,938,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10099/500000]
+ train/ActionL1Loss=0.0302
+ throughput/total_tokens=1,939,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10100/500000]
+ optim/total_grad_norm=8.807
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=1,939,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10101/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,939,392,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=10102/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,939,584,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=10103/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,939,776,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10104/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,939,968,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10105/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,940,160,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10106/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,940,352,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10107/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,940,544,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10108/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,940,736,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10109/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,940,928,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10110/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,941,120,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=10111/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,941,312,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10112/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,941,504,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=10113/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,941,696,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10114/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,941,888,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10115/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=1,942,080,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10116/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,942,272,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10117/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,942,464,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10118/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,942,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10119/500000]
+ train/ActionL1Loss=0.0291
+ throughput/total_tokens=1,942,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10120/500000]
+ optim/total_grad_norm=8.225
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=1,943,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10121/500000]
+ train/ActionL1Loss=0.0293
+ throughput/total_tokens=1,943,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10122/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,943,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10123/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=1,943,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10124/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,943,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10125/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=1,944,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10126/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=1,944,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10127/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,944,384,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10128/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,944,576,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10129/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,944,768,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10130/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=1,944,960,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10131/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,945,152,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10132/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,945,344,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10133/500000]
+ train/ActionL1Loss=0.0311
+ throughput/total_tokens=1,945,536,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10134/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,945,728,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10135/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=1,945,920,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10136/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,946,112,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10137/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=1,946,304,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10138/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,946,496,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10139/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,946,688,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10140/500000]
+ optim/total_grad_norm=8.412
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,946,880,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10141/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,947,072,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10142/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,947,264,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10143/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=1,947,456,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10144/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=1,947,648,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10145/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,947,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10146/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,948,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10147/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=1,948,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10148/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=1,948,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10149/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,948,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10150/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,948,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10151/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=1,948,992,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10152/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,949,184,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10153/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,949,376,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10154/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,949,568,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10155/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,949,760,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10156/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=1,949,952,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10157/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,950,144,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10158/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,950,336,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10159/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=1,950,528,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10160/500000]
+ optim/total_grad_norm=7.872
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=1,950,720,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10161/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=1,950,912,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10162/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=1,951,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10163/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,951,296,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10164/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,951,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10165/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,951,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10166/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=1,951,872,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10167/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=1,952,064,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10168/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,952,256,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10169/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=1,952,448,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10170/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,952,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10171/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,952,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10172/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,953,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10173/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,953,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10174/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,953,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10175/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,953,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10176/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=1,953,792,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10177/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,953,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10178/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=1,954,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10179/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=1,954,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10180/500000]
+ optim/total_grad_norm=7.988
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,954,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10181/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,954,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10182/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=1,954,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10183/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,955,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10184/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,955,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10185/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,955,520,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10186/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=1,955,712,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10187/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,955,904,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10188/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,956,096,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10189/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,956,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10190/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,956,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10191/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,956,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10192/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,956,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10193/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,957,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10194/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,957,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10195/500000]
+ train/ActionL1Loss=0.0337
+ throughput/total_tokens=1,957,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10196/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=1,957,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10197/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=1,957,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10198/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=1,958,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10199/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,958,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10200/500000]
+ optim/total_grad_norm=8.457
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,958,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10201/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,958,592,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10202/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,958,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10203/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,958,976,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10204/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,959,168,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10205/500000]
+ train/ActionL1Loss=0.0148
+ throughput/total_tokens=1,959,360,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10206/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,959,552,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10207/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,959,744,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10208/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,959,936,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10209/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,960,128,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10210/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,960,320,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=10211/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=1,960,512,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10212/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,960,704,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10213/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,960,896,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10214/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,961,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=10215/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,961,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10216/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,961,472,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10217/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,961,664,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10218/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,961,856,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10219/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=1,962,048,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10220/500000]
+ optim/total_grad_norm=8.018
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,962,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10221/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=1,962,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10222/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=1,962,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10223/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,962,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10224/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,963,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10225/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,963,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10226/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=1,963,392,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10227/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,963,584,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10228/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=1,963,776,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10229/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,963,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10230/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,964,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10231/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,964,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10232/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,964,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10233/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,964,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10234/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,964,928,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10235/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=1,965,120,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10236/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=1,965,312,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10237/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=1,965,504,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10238/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,965,696,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10239/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=1,965,888,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10240/500000]
+ optim/total_grad_norm=8.516
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,966,080,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10241/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=1,966,272,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10242/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,966,464,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10243/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=1,966,656,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10244/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,966,848,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10245/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=1,967,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10246/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=1,967,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10247/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,967,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10248/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,967,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10249/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=1,967,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10250/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=1,968,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10251/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,968,192,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10252/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=1,968,384,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10253/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=1,968,576,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10254/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,968,768,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10255/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=1,968,960,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10256/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,969,152,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10257/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,969,344,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10258/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,969,536,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10259/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,969,728,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10260/500000]
+ optim/total_grad_norm=8.534
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=1,969,920,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10261/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,970,112,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10262/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=1,970,304,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10263/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,970,496,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10264/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,970,688,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10265/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,970,880,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10266/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,971,072,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10267/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,971,264,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10268/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,971,456,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10269/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,971,648,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10270/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,971,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10271/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=1,972,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10272/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=1,972,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10273/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,972,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10274/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,972,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10275/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,972,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10276/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,972,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10277/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,973,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10278/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=1,973,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10279/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,973,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10280/500000]
+ optim/total_grad_norm=7.015
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=1,973,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10281/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,973,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10282/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=1,974,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10283/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,974,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10284/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,974,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10285/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,974,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10286/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,974,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10287/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=1,975,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10288/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=1,975,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10289/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,975,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10290/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,975,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10291/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,975,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10292/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=1,976,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10293/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=1,976,256,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10294/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=1,976,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10295/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,976,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10296/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,976,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10297/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=1,977,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10298/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,977,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=10299/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,977,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10300/500000]
+ optim/total_grad_norm=7.704
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=1,977,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10301/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=1,977,792,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=10302/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=1,977,984,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=10303/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=1,978,176,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=10304/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=1,978,368,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=10305/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,978,560,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=10306/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,978,752,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=10307/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,978,944,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=10308/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,979,136,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=10309/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,979,328,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=10310/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=1,979,520,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+ System/Peak GPU Memory (MB)=46,917
+[step=10311/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=1,979,712,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=10312/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=1,979,904,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=10313/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=1,980,096,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=10314/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,980,288,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=10315/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=1,980,480,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=10316/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,980,672,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=10317/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,980,864,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+[step=10318/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,981,056,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=10319/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=1,981,248,000
+ throughput/device/tokens_per_second=1,170
+ throughput/device/batches_per_second=0.0488
+[step=10320/500000]
+ optim/total_grad_norm=5.687
+ train/ActionL1Loss=0.0154
+ throughput/total_tokens=1,981,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10321/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=1,981,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10322/500000]
+ train/ActionL1Loss=0.0156
+ throughput/total_tokens=1,981,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10323/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=1,982,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10324/500000]
+ train/ActionL1Loss=0.0154
+ throughput/total_tokens=1,982,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10325/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,982,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10326/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=1,982,592,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10327/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=1,982,784,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10328/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=1,982,976,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10329/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,983,168,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10330/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,983,360,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10331/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=1,983,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10332/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,983,744,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10333/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,983,936,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10334/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=1,984,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10335/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,984,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10336/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=1,984,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10337/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,984,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10338/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=1,984,896,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10339/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=1,985,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10340/500000]
+ optim/total_grad_norm=6.755
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,985,280,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10341/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,985,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=10342/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=1,985,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10343/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=1,985,856,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10344/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,986,048,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10345/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=1,986,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10346/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=1,986,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10347/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=1,986,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10348/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,986,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10349/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=1,987,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10350/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=1,987,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10351/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=1,987,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10352/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=1,987,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10353/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=1,987,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10354/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=1,987,968,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10355/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=1,988,160,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10356/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,988,352,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10357/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=1,988,544,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10358/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,988,736,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10359/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,988,928,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10360/500000]
+ optim/total_grad_norm=8.004
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=1,989,120,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10361/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=1,989,312,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10362/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,989,504,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10363/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=1,989,696,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10364/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=1,989,888,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10365/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=1,990,080,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10366/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=1,990,272,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10367/500000]
+ train/ActionL1Loss=0.0158
+ throughput/total_tokens=1,990,464,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10368/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,990,656,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10369/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=1,990,848,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10370/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,991,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10371/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=1,991,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10372/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,991,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10373/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=1,991,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10374/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=1,991,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10375/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,992,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10376/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,992,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10377/500000]
+ train/ActionL1Loss=0.0289
+ throughput/total_tokens=1,992,384,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10378/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=1,992,576,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10379/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=1,992,768,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10380/500000]
+ optim/total_grad_norm=6.996
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=1,992,960,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10381/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=1,993,152,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10382/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=1,993,344,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10383/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=1,993,536,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10384/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=1,993,728,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10385/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=1,993,920,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10386/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=1,994,112,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10387/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=1,994,304,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10388/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=1,994,496,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10389/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=1,994,688,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10390/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=1,994,880,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10391/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,995,072,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10392/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=1,995,264,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10393/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=1,995,456,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10394/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=1,995,648,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10395/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=1,995,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10396/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=1,996,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10397/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=1,996,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10398/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=1,996,416,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10399/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,996,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10400/500000]
+ optim/total_grad_norm=6.845
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,996,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10401/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=1,996,992,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10402/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=1,997,184,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10403/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=1,997,376,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10404/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,997,568,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10405/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=1,997,760,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10406/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=1,997,952,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10407/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=1,998,144,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10408/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=1,998,336,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10409/500000]
+ train/ActionL1Loss=0.0153
+ throughput/total_tokens=1,998,528,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10410/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=1,998,720,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10411/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=1,998,912,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10412/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=1,999,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10413/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=1,999,296,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10414/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=1,999,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10415/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=1,999,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10416/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=1,999,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10417/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,000,064,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10418/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=2,000,256,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10419/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=2,000,448,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10420/500000]
+ optim/total_grad_norm=8.456
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=2,000,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10421/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,000,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10422/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=2,001,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10423/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,001,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10424/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,001,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10425/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,001,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10426/500000]
+ train/ActionL1Loss=0.0158
+ throughput/total_tokens=2,001,792,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10427/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,001,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10428/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,002,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10429/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,002,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10430/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=2,002,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10431/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=2,002,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10432/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,002,944,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=10433/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,003,136,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10434/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,003,328,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10435/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,003,520,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10436/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=2,003,712,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10437/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,003,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10438/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,004,096,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10439/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,004,288,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10440/500000]
+ optim/total_grad_norm=6.912
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,004,480,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10441/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,004,672,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10442/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,004,864,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10443/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=2,005,056,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10444/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,005,248,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10445/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=2,005,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10446/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,005,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10447/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,005,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10448/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,006,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=10449/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,006,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10450/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=2,006,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10451/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,006,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=10452/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,006,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=10453/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,006,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10454/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=2,007,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10455/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=2,007,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10456/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=2,007,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10457/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,007,744,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10458/500000]
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=2,007,936,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10459/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,008,128,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10460/500000]
+ optim/total_grad_norm=6.476
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,008,320,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10461/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,008,512,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10462/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=2,008,704,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10463/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,008,896,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10464/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=2,009,088,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10465/500000]
+ train/ActionL1Loss=0.0288
+ throughput/total_tokens=2,009,280,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10466/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=2,009,472,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10467/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=2,009,664,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10468/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,009,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10469/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,010,048,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10470/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,010,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10471/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,010,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10472/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=2,010,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10473/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=2,010,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10474/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,011,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10475/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,011,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10476/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=2,011,392,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10477/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=2,011,584,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10478/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=2,011,776,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10479/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=2,011,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10480/500000]
+ optim/total_grad_norm=8.504
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,012,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10481/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,012,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10482/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=2,012,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10483/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,012,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10484/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=2,012,928,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10485/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=2,013,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10486/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,013,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10487/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,013,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10488/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,013,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10489/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=2,013,888,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10490/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=2,014,080,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10491/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,014,272,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10492/500000]
+ train/ActionL1Loss=0.0342
+ throughput/total_tokens=2,014,464,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10493/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=2,014,656,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10494/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=2,014,848,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10495/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=2,015,040,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10496/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,015,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10497/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=2,015,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10498/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=2,015,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10499/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=2,015,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10500/500000]
+ optim/total_grad_norm=10.35
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,016,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+10/05 [05:20:36] INFO | >> Saving config... checkpoint.py:608
+10/05 [05:21:25] INFO | >> Saving model state... checkpoint.py:796
+10/05 [05:22:33] INFO | >> Saving optim state... checkpoint.py:811
+10/05 [05:24:00] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=10501/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,016,192,000
+ throughput/device/tokens_per_second=1,220
+ throughput/device/batches_per_second=0.0509
+[step=10502/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,016,384,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10503/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,016,576,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=10504/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=2,016,768,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=10505/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=2,016,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10506/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=2,017,152,000
+ throughput/device/tokens_per_second=1,158
+ throughput/device/batches_per_second=0.0483
+[step=10507/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,017,344,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0485
+[step=10508/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=2,017,536,000
+ throughput/device/tokens_per_second=1,166
+ throughput/device/batches_per_second=0.0486
+[step=10509/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,017,728,000
+ throughput/device/tokens_per_second=1,168
+ throughput/device/batches_per_second=0.0487
+[step=10510/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,017,920,000
+ throughput/device/tokens_per_second=1,169
+ throughput/device/batches_per_second=0.0487
+ System/Peak GPU Memory (MB)=46,917
+[step=10511/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,018,112,000
+ throughput/device/tokens_per_second=1,171
+ throughput/device/batches_per_second=0.0488
+[step=10512/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=2,018,304,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0488
+[step=10513/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,018,496,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=10514/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=2,018,688,000
+ throughput/device/tokens_per_second=1,174
+ throughput/device/batches_per_second=0.0489
+[step=10515/500000]
+ train/ActionL1Loss=0.0314
+ throughput/total_tokens=2,018,880,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=10516/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=2,019,072,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=10517/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,019,264,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=10518/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=2,019,456,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0490
+[step=10519/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,019,648,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0491
+[step=10520/500000]
+ optim/total_grad_norm=9.783
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=2,019,840,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0491
+ System/Peak GPU Memory (MB)=46,917
+[step=10521/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,020,032,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0491
+[step=10522/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,020,224,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=10523/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,020,416,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10524/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,020,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10525/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,020,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10526/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,020,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10527/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,021,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10528/500000]
+ train/ActionL1Loss=0.0306
+ throughput/total_tokens=2,021,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10529/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,021,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10530/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,021,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10531/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=2,021,952,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10532/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,022,144,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10533/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,022,336,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10534/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,022,528,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10535/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,022,720,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10536/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,022,912,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10537/500000]
+ train/ActionL1Loss=0.0140
+ throughput/total_tokens=2,023,104,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10538/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,023,296,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10539/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,023,488,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10540/500000]
+ optim/total_grad_norm=7.195
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,023,680,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10541/500000]
+ train/ActionL1Loss=0.0156
+ throughput/total_tokens=2,023,872,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10542/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,024,064,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10543/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=2,024,256,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10544/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,024,448,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10545/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=2,024,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10546/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,024,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10547/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,025,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10548/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,025,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10549/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=2,025,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10550/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,025,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10551/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=2,025,792,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=10552/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,025,984,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=10553/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,026,176,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=10554/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,026,368,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=10555/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,026,560,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=10556/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=2,026,752,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=10557/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,026,944,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=10558/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,027,136,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=10559/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=2,027,328,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=10560/500000]
+ optim/total_grad_norm=6.772
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,027,520,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+ System/Peak GPU Memory (MB)=46,917
+[step=10561/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=2,027,712,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=10562/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,027,904,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=10563/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,028,096,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=10564/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,028,288,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=10565/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,028,480,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=10566/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,028,672,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=10567/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=2,028,864,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=10568/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=2,029,056,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=10569/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=2,029,248,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=10570/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=2,029,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10571/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=2,029,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10572/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=2,029,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10573/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,030,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10574/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,030,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10575/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=2,030,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10576/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=2,030,592,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=10577/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,030,784,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=10578/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,030,976,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=10579/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,031,168,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=10580/500000]
+ optim/total_grad_norm=7.496
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,031,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10581/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,031,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10582/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,031,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10583/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=2,031,936,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10584/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=2,032,128,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10585/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=2,032,320,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10586/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=2,032,512,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10587/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=2,032,704,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10588/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,032,896,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10589/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,033,088,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10590/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,033,280,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10591/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,033,472,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10592/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,033,664,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10593/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,033,856,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10594/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,034,048,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10595/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,034,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10596/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,034,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10597/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,034,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10598/500000]
+ train/ActionL1Loss=0.0151
+ throughput/total_tokens=2,034,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10599/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,035,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10600/500000]
+ optim/total_grad_norm=9.051
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,035,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10601/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=2,035,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10602/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=2,035,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10603/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,035,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10604/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,035,968,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10605/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,036,160,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10606/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,036,352,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10607/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,036,544,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10608/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,036,736,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10609/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,036,928,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10610/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=2,037,120,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10611/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,037,312,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10612/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,037,504,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10613/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,037,696,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10614/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,037,888,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10615/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,038,080,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10616/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=2,038,272,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10617/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,038,464,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10618/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,038,656,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10619/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,038,848,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10620/500000]
+ optim/total_grad_norm=6.703
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,039,040,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10621/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,039,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10622/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,039,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10623/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,039,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10624/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,039,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10625/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,040,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10626/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=2,040,192,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10627/500000]
+ train/ActionL1Loss=0.0150
+ throughput/total_tokens=2,040,384,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10628/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,040,576,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10629/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,040,768,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10630/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,040,960,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10631/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=2,041,152,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10632/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,041,344,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10633/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,041,536,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10634/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=2,041,728,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10635/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,041,920,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10636/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=2,042,112,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10637/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=2,042,304,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10638/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,042,496,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10639/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,042,688,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10640/500000]
+ optim/total_grad_norm=8.415
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,042,880,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10641/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=2,043,072,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10642/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=2,043,264,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10643/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=2,043,456,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10644/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,043,648,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10645/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,043,840,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10646/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,044,032,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10647/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=2,044,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10648/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,044,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10649/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=2,044,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10650/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=2,044,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10651/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,044,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=10652/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=2,045,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10653/500000]
+ train/ActionL1Loss=0.0317
+ throughput/total_tokens=2,045,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10654/500000]
+ train/ActionL1Loss=0.0304
+ throughput/total_tokens=2,045,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10655/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,045,760,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=10656/500000]
+ train/ActionL1Loss=0.0269
+ throughput/total_tokens=2,045,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=10657/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=2,046,144,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10658/500000]
+ train/ActionL1Loss=0.0299
+ throughput/total_tokens=2,046,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10659/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,046,528,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10660/500000]
+ optim/total_grad_norm=6.875
+ train/ActionL1Loss=0.0278
+ throughput/total_tokens=2,046,720,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=10661/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=2,046,912,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10662/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,047,104,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10663/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=2,047,296,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10664/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,047,488,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10665/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,047,680,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10666/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=2,047,872,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10667/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,048,064,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10668/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=2,048,256,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10669/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,048,448,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=10670/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=2,048,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10671/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=2,048,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10672/500000]
+ train/ActionL1Loss=0.0275
+ throughput/total_tokens=2,049,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10673/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=2,049,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10674/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,049,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10675/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=2,049,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10676/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=2,049,792,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10677/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=2,049,984,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10678/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,050,176,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10679/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=2,050,368,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10680/500000]
+ optim/total_grad_norm=8.370
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=2,050,560,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10681/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,050,752,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10682/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=2,050,944,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10683/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=2,051,136,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10684/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,051,328,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10685/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,051,520,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10686/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,051,712,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10687/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,051,904,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10688/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=2,052,096,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10689/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,052,288,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10690/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,052,480,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10691/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=2,052,672,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10692/500000]
+ train/ActionL1Loss=0.0163
+ throughput/total_tokens=2,052,864,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10693/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,053,056,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10694/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,053,248,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10695/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,053,440,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10696/500000]
+ train/ActionL1Loss=0.0163
+ throughput/total_tokens=2,053,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10697/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,053,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10698/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,054,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10699/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,054,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10700/500000]
+ optim/total_grad_norm=6.852
+ train/ActionL1Loss=0.0151
+ throughput/total_tokens=2,054,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10701/500000]
+ train/ActionL1Loss=0.0158
+ throughput/total_tokens=2,054,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10702/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,054,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10703/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,054,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10704/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=2,055,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10705/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=2,055,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10706/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,055,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10707/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,055,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10708/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=2,055,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10709/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,056,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10710/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,056,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10711/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,056,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10712/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,056,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10713/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,056,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10714/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=2,057,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10715/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,057,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10716/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,057,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10717/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,057,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10718/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=2,057,856,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10719/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=2,058,048,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10720/500000]
+ optim/total_grad_norm=7.434
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,058,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10721/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,058,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10722/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=2,058,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10723/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=2,058,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10724/500000]
+ train/ActionL1Loss=0.0159
+ throughput/total_tokens=2,059,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10725/500000]
+ train/ActionL1Loss=0.0266
+ throughput/total_tokens=2,059,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10726/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,059,392,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10727/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,059,584,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10728/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=2,059,776,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10729/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=2,059,968,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10730/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,060,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10731/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,060,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10732/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,060,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10733/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,060,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10734/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=2,060,928,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10735/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,061,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10736/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=2,061,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10737/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,061,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10738/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=2,061,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10739/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,061,888,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10740/500000]
+ optim/total_grad_norm=8.424
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,062,080,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10741/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,062,272,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10742/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,062,464,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10743/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,062,656,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10744/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,062,848,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10745/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,063,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10746/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,063,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10747/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,063,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10748/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,063,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10749/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=2,063,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10750/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,064,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10751/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,064,192,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+[step=10752/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=2,064,384,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+[step=10753/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=2,064,576,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0488
+[step=10754/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,064,768,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0488
+[step=10755/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,064,960,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0488
+[step=10756/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=2,065,152,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+[step=10757/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,065,344,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+[step=10758/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=2,065,536,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+[step=10759/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,065,728,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+[step=10760/500000]
+ optim/total_grad_norm=8.290
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,065,920,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+ System/Peak GPU Memory (MB)=46,917
+[step=10761/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=2,066,112,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+[step=10762/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=2,066,304,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+[step=10763/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=2,066,496,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+[step=10764/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,066,688,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+[step=10765/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,066,880,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+[step=10766/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=2,067,072,000
+ throughput/device/tokens_per_second=1,172
+ throughput/device/batches_per_second=0.0489
+[step=10767/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,067,264,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=10768/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,067,456,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=10769/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,067,648,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=10770/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,067,840,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=10771/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,068,032,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10772/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=2,068,224,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10773/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,068,416,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10774/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=2,068,608,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10775/500000]
+ train/ActionL1Loss=0.0274
+ throughput/total_tokens=2,068,800,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10776/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=2,068,992,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10777/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,069,184,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10778/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=2,069,376,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10779/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,069,568,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10780/500000]
+ optim/total_grad_norm=7.986
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,069,760,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=10781/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,069,952,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10782/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,070,144,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10783/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,070,336,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10784/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,070,528,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10785/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=2,070,720,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10786/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,070,912,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10787/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=2,071,104,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10788/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,071,296,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10789/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=2,071,488,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10790/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=2,071,680,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10791/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=2,071,872,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10792/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=2,072,064,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10793/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,072,256,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10794/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=2,072,448,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10795/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,072,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10796/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,072,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10797/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=2,073,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=10798/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,073,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10799/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,073,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10800/500000]
+ optim/total_grad_norm=8.247
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=2,073,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10801/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,073,792,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10802/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,073,984,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10803/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,074,176,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10804/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,074,368,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10805/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=2,074,560,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=10806/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=2,074,752,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=10807/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=2,074,944,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=10808/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,075,136,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=10809/500000]
+ train/ActionL1Loss=0.0294
+ throughput/total_tokens=2,075,328,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=10810/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,075,520,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=10811/500000]
+ train/ActionL1Loss=0.0160
+ throughput/total_tokens=2,075,712,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=10812/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,075,904,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=10813/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,076,096,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=10814/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,076,288,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=10815/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,076,480,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=10816/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=2,076,672,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10817/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=2,076,864,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=10818/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,077,056,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10819/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=2,077,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10820/500000]
+ optim/total_grad_norm=8.517
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=2,077,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10821/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=2,077,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10822/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,077,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10823/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=2,078,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10824/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,078,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10825/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,078,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10826/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,078,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10827/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,078,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10828/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,078,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10829/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=2,079,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10830/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=2,079,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10831/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,079,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10832/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=2,079,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10833/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=2,079,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10834/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=2,080,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10835/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,080,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10836/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,080,512,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10837/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,080,704,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10838/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=2,080,896,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10839/500000]
+ train/ActionL1Loss=0.0297
+ throughput/total_tokens=2,081,088,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10840/500000]
+ optim/total_grad_norm=9.961
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=2,081,280,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10841/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=2,081,472,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10842/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,081,664,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10843/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,081,856,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10844/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,082,048,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10845/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=2,082,240,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10846/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,082,432,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10847/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,082,624,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10848/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,082,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10849/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,083,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10850/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=2,083,200,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10851/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,083,392,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10852/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,083,584,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10853/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,083,776,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10854/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=2,083,968,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10855/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=2,084,160,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10856/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=2,084,352,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10857/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,084,544,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10858/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=2,084,736,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10859/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,084,928,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10860/500000]
+ optim/total_grad_norm=9.501
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,085,120,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10861/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=2,085,312,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10862/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=2,085,504,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10863/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,085,696,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10864/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=2,085,888,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10865/500000]
+ train/ActionL1Loss=0.0158
+ throughput/total_tokens=2,086,080,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10866/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,086,272,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10867/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=2,086,464,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10868/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,086,656,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10869/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,086,848,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10870/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,087,040,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=10871/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=2,087,232,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10872/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=2,087,424,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10873/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,087,616,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10874/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,087,808,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10875/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,088,000,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10876/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,088,192,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10877/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,088,384,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10878/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,088,576,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10879/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,088,768,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10880/500000]
+ optim/total_grad_norm=6.060
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=2,088,960,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10881/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,089,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10882/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,089,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10883/500000]
+ train/ActionL1Loss=0.0292
+ throughput/total_tokens=2,089,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10884/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,089,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10885/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,089,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10886/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,090,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10887/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,090,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10888/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,090,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10889/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,090,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10890/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,090,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10891/500000]
+ train/ActionL1Loss=0.0154
+ throughput/total_tokens=2,091,072,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=10892/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,091,264,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=10893/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,091,456,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=10894/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,091,648,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=10895/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,091,840,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10896/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,092,032,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10897/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,092,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10898/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,092,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10899/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,092,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10900/500000]
+ optim/total_grad_norm=6.326
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,092,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10901/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=2,092,992,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10902/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=2,093,184,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10903/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,093,376,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10904/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,093,568,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10905/500000]
+ train/ActionL1Loss=0.0160
+ throughput/total_tokens=2,093,760,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10906/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,093,952,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10907/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,094,144,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10908/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,094,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10909/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,094,528,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10910/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,094,720,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=10911/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,094,912,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10912/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,095,104,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10913/500000]
+ train/ActionL1Loss=0.0163
+ throughput/total_tokens=2,095,296,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=10914/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,095,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=10915/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,095,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=10916/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,095,872,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=10917/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,096,064,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10918/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,096,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10919/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,096,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10920/500000]
+ optim/total_grad_norm=9.498
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,096,640,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10921/500000]
+ train/ActionL1Loss=0.0159
+ throughput/total_tokens=2,096,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10922/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,097,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10923/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,097,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10924/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,097,408,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10925/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,097,600,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10926/500000]
+ train/ActionL1Loss=0.0152
+ throughput/total_tokens=2,097,792,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10927/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=2,097,984,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10928/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,098,176,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10929/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,098,368,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10930/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,098,560,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10931/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=2,098,752,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10932/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,098,944,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10933/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,099,136,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10934/500000]
+ train/ActionL1Loss=0.0159
+ throughput/total_tokens=2,099,328,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10935/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=2,099,520,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10936/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=2,099,712,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10937/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,099,904,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10938/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,100,096,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10939/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,100,288,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10940/500000]
+ optim/total_grad_norm=7.842
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,100,480,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10941/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,100,672,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10942/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,100,864,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10943/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,101,056,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10944/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,101,248,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10945/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,101,440,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10946/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=2,101,632,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10947/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,101,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10948/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,102,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10949/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,102,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10950/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=2,102,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10951/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,102,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=10952/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=2,102,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=10953/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=2,102,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10954/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,103,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10955/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=2,103,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10956/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,103,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10957/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,103,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10958/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,103,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10959/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=2,104,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10960/500000]
+ optim/total_grad_norm=8.068
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=2,104,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=10961/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,104,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10962/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,104,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10963/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,104,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10964/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,105,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10965/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=2,105,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=10966/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=2,105,472,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10967/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=2,105,664,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=10968/500000]
+ train/ActionL1Loss=0.0300
+ throughput/total_tokens=2,105,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10969/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=2,106,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=10970/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=2,106,240,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+ System/Peak GPU Memory (MB)=46,917
+[step=10971/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,106,432,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=10972/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=2,106,624,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10973/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=2,106,816,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10974/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,107,008,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10975/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,107,200,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10976/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,107,392,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10977/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,107,584,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10978/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,107,776,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10979/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=2,107,968,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=10980/500000]
+ optim/total_grad_norm=6.907
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=2,108,160,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10981/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,108,352,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=10982/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,108,544,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10983/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=2,108,736,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10984/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,108,928,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10985/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,109,120,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10986/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,109,312,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10987/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=2,109,504,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10988/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,109,696,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10989/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=2,109,888,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10990/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,110,080,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=10991/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=2,110,272,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10992/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,110,464,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10993/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=2,110,656,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10994/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=2,110,848,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10995/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,111,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10996/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=2,111,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10997/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=2,111,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10998/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=2,111,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=10999/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=2,111,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11000/500000]
+ optim/total_grad_norm=7.118
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,112,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+10/05 [08:14:17] INFO | >> Saving config... checkpoint.py:608
+10/05 [08:14:53] INFO | >> Saving model state... checkpoint.py:796
+10/05 [08:16:03] INFO | >> Saving optim state... checkpoint.py:811
+10/05 [08:17:33] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=11001/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=2,112,192,000
+ throughput/device/tokens_per_second=1,221
+ throughput/device/batches_per_second=0.0509
+[step=11002/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,112,384,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=11003/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,112,576,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=11004/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,112,768,000
+ throughput/device/tokens_per_second=1,162
+ throughput/device/batches_per_second=0.0484
+[step=11005/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,112,960,000
+ throughput/device/tokens_per_second=1,167
+ throughput/device/batches_per_second=0.0487
+[step=11006/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,113,152,000
+ throughput/device/tokens_per_second=1,171
+ throughput/device/batches_per_second=0.0488
+[step=11007/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,113,344,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+[step=11008/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=2,113,536,000
+ throughput/device/tokens_per_second=1,175
+ throughput/device/batches_per_second=0.0490
+[step=11009/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,113,728,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+[step=11010/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,113,920,000
+ throughput/device/tokens_per_second=1,176
+ throughput/device/batches_per_second=0.0490
+ System/Peak GPU Memory (MB)=46,917
+[step=11011/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,114,112,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0491
+[step=11012/500000]
+ train/ActionL1Loss=0.0148
+ throughput/total_tokens=2,114,304,000
+ throughput/device/tokens_per_second=1,178
+ throughput/device/batches_per_second=0.0491
+[step=11013/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,114,496,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=11014/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,114,688,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0492
+[step=11015/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,114,880,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=11016/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,115,072,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=11017/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,115,264,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=11018/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,115,456,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=11019/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,115,648,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=11020/500000]
+ optim/total_grad_norm=8.653
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,115,840,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+ System/Peak GPU Memory (MB)=46,917
+[step=11021/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,116,032,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=11022/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=2,116,224,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11023/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=2,116,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11024/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,116,608,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11025/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,116,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11026/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=2,116,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11027/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,117,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11028/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=2,117,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11029/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,117,568,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11030/500000]
+ train/ActionL1Loss=0.0151
+ throughput/total_tokens=2,117,760,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11031/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,117,952,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11032/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=2,118,144,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11033/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=2,118,336,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11034/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,118,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11035/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,118,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11036/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,118,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11037/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=2,119,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11038/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=2,119,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11039/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=2,119,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11040/500000]
+ optim/total_grad_norm=9.619
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,119,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11041/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,119,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11042/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,120,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11043/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,120,256,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11044/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=2,120,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11045/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,120,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11046/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,120,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11047/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,121,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11048/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=2,121,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11049/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,121,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11050/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,121,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11051/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,121,792,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11052/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,121,984,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11053/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=2,122,176,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11054/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,122,368,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11055/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=2,122,560,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11056/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,122,752,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11057/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,122,944,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11058/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,123,136,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11059/500000]
+ train/ActionL1Loss=0.0154
+ throughput/total_tokens=2,123,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11060/500000]
+ optim/total_grad_norm=8.709
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,123,520,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11061/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,123,712,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11062/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,123,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11063/500000]
+ train/ActionL1Loss=0.0147
+ throughput/total_tokens=2,124,096,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11064/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,124,288,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11065/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=2,124,480,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11066/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,124,672,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11067/500000]
+ train/ActionL1Loss=0.0153
+ throughput/total_tokens=2,124,864,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11068/500000]
+ train/ActionL1Loss=0.0147
+ throughput/total_tokens=2,125,056,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11069/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,125,248,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11070/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,125,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11071/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=2,125,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11072/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,125,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11073/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,126,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11074/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,126,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11075/500000]
+ train/ActionL1Loss=0.0163
+ throughput/total_tokens=2,126,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11076/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,126,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11077/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=2,126,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11078/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,126,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11079/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=2,127,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11080/500000]
+ optim/total_grad_norm=7.144
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=2,127,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11081/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,127,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11082/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,127,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11083/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=2,127,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11084/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=2,128,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11085/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=2,128,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11086/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,128,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11087/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=2,128,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11088/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,128,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11089/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,129,088,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11090/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,129,280,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11091/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,129,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11092/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=2,129,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11093/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,129,856,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11094/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,130,048,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11095/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,130,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11096/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=2,130,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11097/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,130,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11098/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=2,130,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11099/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,131,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11100/500000]
+ optim/total_grad_norm=7.778
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,131,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11101/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=2,131,392,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11102/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,131,584,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11103/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=2,131,776,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11104/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,131,968,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11105/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,132,160,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11106/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=2,132,352,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11107/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=2,132,544,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11108/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,132,736,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11109/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,132,928,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11110/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,133,120,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11111/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=2,133,312,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11112/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,133,504,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11113/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=2,133,696,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11114/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,133,888,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11115/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,134,080,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11116/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,134,272,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11117/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,134,464,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11118/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,134,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11119/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=2,134,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11120/500000]
+ optim/total_grad_norm=7.234
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,135,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11121/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,135,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11122/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,135,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11123/500000]
+ train/ActionL1Loss=0.0155
+ throughput/total_tokens=2,135,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11124/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,135,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11125/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,136,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11126/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,136,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11127/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,136,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11128/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,136,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11129/500000]
+ train/ActionL1Loss=0.0249
+ throughput/total_tokens=2,136,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11130/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=2,136,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11131/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=2,137,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11132/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,137,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11133/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,137,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11134/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,137,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11135/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=2,137,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11136/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,138,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11137/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,138,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11138/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=2,138,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11139/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,138,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11140/500000]
+ optim/total_grad_norm=8.213
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,138,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11141/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=2,139,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11142/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,139,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11143/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,139,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11144/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,139,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11145/500000]
+ train/ActionL1Loss=0.0267
+ throughput/total_tokens=2,139,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11146/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=2,140,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11147/500000]
+ train/ActionL1Loss=0.0163
+ throughput/total_tokens=2,140,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11148/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,140,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11149/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=2,140,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11150/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=2,140,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11151/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=2,140,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11152/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,141,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11153/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=2,141,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11154/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=2,141,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11155/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,141,760,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11156/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,141,952,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11157/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=2,142,144,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11158/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,142,336,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11159/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=2,142,528,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11160/500000]
+ optim/total_grad_norm=8.197
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=2,142,720,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11161/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,142,912,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11162/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,143,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11163/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,143,296,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11164/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,143,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11165/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,143,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11166/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,143,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11167/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,144,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11168/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,144,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11169/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,144,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11170/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=2,144,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11171/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,144,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11172/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,145,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11173/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,145,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11174/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,145,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11175/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,145,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11176/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,145,792,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11177/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,145,984,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11178/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,146,176,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11179/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,146,368,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11180/500000]
+ optim/total_grad_norm=7.310
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=2,146,560,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11181/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,146,752,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11182/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,146,944,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11183/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,147,136,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11184/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,147,328,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11185/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,147,520,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11186/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=2,147,712,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11187/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,147,904,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11188/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,148,096,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11189/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,148,288,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11190/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,148,480,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11191/500000]
+ train/ActionL1Loss=0.0154
+ throughput/total_tokens=2,148,672,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11192/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,148,864,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11193/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=2,149,056,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11194/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=2,149,248,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11195/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,149,440,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11196/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,149,632,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11197/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,149,824,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11198/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=2,150,016,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11199/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,150,208,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11200/500000]
+ optim/total_grad_norm=7.389
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,150,400,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11201/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=2,150,592,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11202/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=2,150,784,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11203/500000]
+ train/ActionL1Loss=0.0273
+ throughput/total_tokens=2,150,976,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11204/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=2,151,168,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11205/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,151,360,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11206/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=2,151,552,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11207/500000]
+ train/ActionL1Loss=0.0307
+ throughput/total_tokens=2,151,744,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11208/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=2,151,936,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11209/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,152,128,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11210/500000]
+ train/ActionL1Loss=0.0285
+ throughput/total_tokens=2,152,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11211/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=2,152,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11212/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,152,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11213/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,152,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11214/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=2,153,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11215/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=2,153,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11216/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,153,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11217/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,153,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11218/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=2,153,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11219/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,154,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11220/500000]
+ optim/total_grad_norm=7.599
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=2,154,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11221/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,154,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11222/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,154,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11223/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=2,154,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11224/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,155,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11225/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,155,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11226/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,155,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11227/500000]
+ train/ActionL1Loss=0.0159
+ throughput/total_tokens=2,155,584,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11228/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,155,776,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11229/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=2,155,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11230/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,156,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11231/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=2,156,352,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11232/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=2,156,544,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11233/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,156,736,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11234/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,156,928,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11235/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,157,120,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11236/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=2,157,312,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11237/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,157,504,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11238/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,157,696,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11239/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,157,888,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11240/500000]
+ optim/total_grad_norm=7.200
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,158,080,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11241/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,158,272,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11242/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=2,158,464,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11243/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,158,656,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11244/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=2,158,848,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11245/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,159,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11246/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,159,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11247/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,159,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11248/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,159,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11249/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,159,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11250/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=2,160,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11251/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,160,192,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11252/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,160,384,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11253/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,160,576,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11254/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,160,768,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11255/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,160,960,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11256/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,161,152,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11257/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=2,161,344,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11258/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=2,161,536,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11259/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,161,728,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11260/500000]
+ optim/total_grad_norm=8.090
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,161,920,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11261/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,162,112,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11262/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,162,304,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11263/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,162,496,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11264/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,162,688,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11265/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,162,880,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11266/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=2,163,072,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11267/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,163,264,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11268/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,163,456,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11269/500000]
+ train/ActionL1Loss=0.0143
+ throughput/total_tokens=2,163,648,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11270/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,163,840,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11271/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,164,032,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11272/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,164,224,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11273/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,164,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11274/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,164,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11275/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,164,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11276/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,164,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11277/500000]
+ train/ActionL1Loss=0.0163
+ throughput/total_tokens=2,165,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11278/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,165,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11279/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,165,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11280/500000]
+ optim/total_grad_norm=9.387
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,165,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11281/500000]
+ train/ActionL1Loss=0.0152
+ throughput/total_tokens=2,165,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11282/500000]
+ train/ActionL1Loss=0.0139
+ throughput/total_tokens=2,166,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11283/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,166,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11284/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,166,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11285/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,166,720,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11286/500000]
+ train/ActionL1Loss=0.0158
+ throughput/total_tokens=2,166,912,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11287/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,167,104,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11288/500000]
+ train/ActionL1Loss=0.0153
+ throughput/total_tokens=2,167,296,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11289/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=2,167,488,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11290/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,167,680,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11291/500000]
+ train/ActionL1Loss=0.0286
+ throughput/total_tokens=2,167,872,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11292/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=2,168,064,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11293/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,168,256,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11294/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,168,448,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11295/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,168,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11296/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,168,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11297/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=2,169,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11298/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,169,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11299/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,169,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11300/500000]
+ optim/total_grad_norm=9.065
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,169,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11301/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,169,792,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11302/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,169,984,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11303/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=2,170,176,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11304/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,170,368,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11305/500000]
+ train/ActionL1Loss=0.0156
+ throughput/total_tokens=2,170,560,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11306/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,170,752,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11307/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,170,944,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11308/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=2,171,136,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11309/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=2,171,328,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11310/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,171,520,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11311/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=2,171,712,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11312/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,171,904,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11313/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,172,096,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11314/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,172,288,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11315/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,172,480,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11316/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,172,672,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11317/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,172,864,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11318/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,173,056,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11319/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,173,248,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11320/500000]
+ optim/total_grad_norm=7.905
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,173,440,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11321/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,173,632,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11322/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=2,173,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11323/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,174,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11324/500000]
+ train/ActionL1Loss=0.0242
+ throughput/total_tokens=2,174,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11325/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,174,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11326/500000]
+ train/ActionL1Loss=0.0150
+ throughput/total_tokens=2,174,592,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11327/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,174,784,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11328/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=2,174,976,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11329/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=2,175,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11330/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=2,175,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11331/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=2,175,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11332/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,175,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11333/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=2,175,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11334/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,176,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11335/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,176,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11336/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,176,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11337/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=2,176,704,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11338/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=2,176,896,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11339/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,177,088,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11340/500000]
+ optim/total_grad_norm=7.924
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,177,280,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11341/500000]
+ train/ActionL1Loss=0.0321
+ throughput/total_tokens=2,177,472,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11342/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,177,664,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11343/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,177,856,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11344/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,178,048,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11345/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,178,240,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11346/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,178,432,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11347/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,178,624,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11348/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,178,816,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11349/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,179,008,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11350/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=2,179,200,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11351/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,179,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11352/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,179,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11353/500000]
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=2,179,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11354/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,179,968,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11355/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=2,180,160,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11356/500000]
+ train/ActionL1Loss=0.0268
+ throughput/total_tokens=2,180,352,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11357/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,180,544,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11358/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,180,736,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11359/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,180,928,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11360/500000]
+ optim/total_grad_norm=6.232
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=2,181,120,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11361/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,181,312,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11362/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,181,504,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11363/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=2,181,696,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11364/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=2,181,888,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11365/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,182,080,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11366/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,182,272,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11367/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,182,464,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11368/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=2,182,656,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11369/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,182,848,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11370/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,183,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11371/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,183,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11372/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,183,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11373/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=2,183,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11374/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=2,183,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11375/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=2,184,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11376/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,184,192,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11377/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=2,184,384,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11378/500000]
+ train/ActionL1Loss=0.0263
+ throughput/total_tokens=2,184,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11379/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,184,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11380/500000]
+ optim/total_grad_norm=7.828
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=2,184,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11381/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,185,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11382/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,185,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11383/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,185,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11384/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,185,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11385/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=2,185,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11386/500000]
+ train/ActionL1Loss=0.0257
+ throughput/total_tokens=2,186,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11387/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,186,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11388/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,186,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11389/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=2,186,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11390/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,186,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11391/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,187,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11392/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,187,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11393/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,187,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11394/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,187,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11395/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,187,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11396/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=2,188,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11397/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=2,188,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11398/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,188,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11399/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,188,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11400/500000]
+ optim/total_grad_norm=7.621
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,188,800,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11401/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,188,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11402/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,189,184,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11403/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,189,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11404/500000]
+ train/ActionL1Loss=0.0153
+ throughput/total_tokens=2,189,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11405/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,189,760,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11406/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,189,952,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11407/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,190,144,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11408/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,190,336,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11409/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,190,528,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11410/500000]
+ train/ActionL1Loss=0.0276
+ throughput/total_tokens=2,190,720,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11411/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,190,912,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11412/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,191,104,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11413/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,191,296,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11414/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,191,488,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11415/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,191,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11416/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,191,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11417/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,192,064,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11418/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,192,256,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11419/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,192,448,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11420/500000]
+ optim/total_grad_norm=7.031
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,192,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11421/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,192,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11422/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,193,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11423/500000]
+ train/ActionL1Loss=0.0151
+ throughput/total_tokens=2,193,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11424/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,193,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11425/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,193,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11426/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=2,193,792,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11427/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=2,193,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11428/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,194,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11429/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,194,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11430/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,194,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11431/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,194,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11432/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,194,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11433/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,195,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11434/500000]
+ train/ActionL1Loss=0.0137
+ throughput/total_tokens=2,195,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11435/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,195,520,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11436/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,195,712,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11437/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,195,904,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11438/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=2,196,096,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11439/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,196,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11440/500000]
+ optim/total_grad_norm=6.868
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,196,480,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11441/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,196,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11442/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,196,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11443/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=2,197,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11444/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,197,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11445/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=2,197,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11446/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,197,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11447/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,197,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11448/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,198,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11449/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,198,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11450/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,198,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11451/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,198,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11452/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,198,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11453/500000]
+ train/ActionL1Loss=0.0251
+ throughput/total_tokens=2,198,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11454/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,199,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11455/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,199,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11456/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=2,199,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11457/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,199,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11458/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=2,199,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11459/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,200,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11460/500000]
+ optim/total_grad_norm=10.60
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=2,200,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=11461/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,200,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11462/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,200,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11463/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,200,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11464/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,201,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11465/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,201,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11466/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=2,201,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11467/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,201,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11468/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,201,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11469/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=2,202,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11470/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=2,202,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11471/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,202,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11472/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,202,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11473/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,202,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11474/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=2,203,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11475/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,203,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11476/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=2,203,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11477/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=2,203,584,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11478/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,203,776,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11479/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,203,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11480/500000]
+ optim/total_grad_norm=8.560
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,204,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11481/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,204,352,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11482/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=2,204,544,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11483/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,204,736,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11484/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,204,928,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11485/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=2,205,120,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11486/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,205,312,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11487/500000]
+ train/ActionL1Loss=0.0326
+ throughput/total_tokens=2,205,504,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11488/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,205,696,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11489/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,205,888,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11490/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,206,080,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11491/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,206,272,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11492/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,206,464,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11493/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,206,656,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11494/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=2,206,848,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11495/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,207,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11496/500000]
+ train/ActionL1Loss=0.0155
+ throughput/total_tokens=2,207,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11497/500000]
+ train/ActionL1Loss=0.0338
+ throughput/total_tokens=2,207,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11498/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=2,207,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11499/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,207,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11500/500000]
+ optim/total_grad_norm=7.959
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,208,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+10/05 [11:07:52] INFO | >> Saving config... checkpoint.py:608
+10/05 [11:08:28] INFO | >> Saving model state... checkpoint.py:796
+10/05 [11:09:38] INFO | >> Saving optim state... checkpoint.py:811
+10/05 [11:11:05] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=11501/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,208,192,000
+ throughput/device/tokens_per_second=1,213
+ throughput/device/batches_per_second=0.0506
+[step=11502/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,208,384,000
+ throughput/device/tokens_per_second=1,179
+ throughput/device/batches_per_second=0.0491
+[step=11503/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,208,576,000
+ throughput/device/tokens_per_second=1,177
+ throughput/device/batches_per_second=0.0491
+[step=11504/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=2,208,768,000
+ throughput/device/tokens_per_second=1,180
+ throughput/device/batches_per_second=0.0492
+[step=11505/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,208,960,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=11506/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,209,152,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11507/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,209,344,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11508/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=2,209,536,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11509/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=2,209,728,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11510/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,209,920,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11511/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,210,112,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11512/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,210,304,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11513/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,210,496,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11514/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,210,688,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11515/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=2,210,880,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11516/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,211,072,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11517/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,211,264,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11518/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,211,456,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11519/500000]
+ train/ActionL1Loss=0.0159
+ throughput/total_tokens=2,211,648,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11520/500000]
+ optim/total_grad_norm=8.397
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=2,211,840,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11521/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=2,212,032,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11522/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,212,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11523/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,212,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11524/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,212,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11525/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,212,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11526/500000]
+ train/ActionL1Loss=0.0158
+ throughput/total_tokens=2,212,992,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11527/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,213,184,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11528/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,213,376,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11529/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,213,568,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11530/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,213,760,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11531/500000]
+ train/ActionL1Loss=0.0153
+ throughput/total_tokens=2,213,952,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11532/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=2,214,144,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11533/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,214,336,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11534/500000]
+ train/ActionL1Loss=0.0160
+ throughput/total_tokens=2,214,528,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11535/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,214,720,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11536/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,214,912,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11537/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,215,104,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11538/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=2,215,296,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11539/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,215,488,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11540/500000]
+ optim/total_grad_norm=7.190
+ train/ActionL1Loss=0.0152
+ throughput/total_tokens=2,215,680,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11541/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,215,872,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11542/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,216,064,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11543/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,216,256,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11544/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,216,448,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11545/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,216,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11546/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=2,216,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11547/500000]
+ train/ActionL1Loss=0.0154
+ throughput/total_tokens=2,217,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11548/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,217,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11549/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,217,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11550/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,217,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11551/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,217,792,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11552/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,217,984,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11553/500000]
+ train/ActionL1Loss=0.0144
+ throughput/total_tokens=2,218,176,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11554/500000]
+ train/ActionL1Loss=0.0159
+ throughput/total_tokens=2,218,368,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11555/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,218,560,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11556/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,218,752,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11557/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=2,218,944,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11558/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,219,136,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11559/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,219,328,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11560/500000]
+ optim/total_grad_norm=8.136
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,219,520,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=11561/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,219,712,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11562/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,219,904,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11563/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,220,096,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11564/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,220,288,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11565/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=2,220,480,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11566/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,220,672,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11567/500000]
+ train/ActionL1Loss=0.0248
+ throughput/total_tokens=2,220,864,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11568/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=2,221,056,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11569/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,221,248,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=11570/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=2,221,440,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11571/500000]
+ train/ActionL1Loss=0.0295
+ throughput/total_tokens=2,221,632,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11572/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,221,824,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11573/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,222,016,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11574/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=2,222,208,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11575/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,222,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11576/500000]
+ train/ActionL1Loss=0.0246
+ throughput/total_tokens=2,222,592,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11577/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=2,222,784,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11578/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,222,976,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11579/500000]
+ train/ActionL1Loss=0.0158
+ throughput/total_tokens=2,223,168,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11580/500000]
+ optim/total_grad_norm=6.408
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,223,360,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11581/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,223,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11582/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=2,223,744,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11583/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,223,936,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11584/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=2,224,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11585/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,224,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11586/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=2,224,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11587/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=2,224,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11588/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=2,224,896,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11589/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,225,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11590/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=2,225,280,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11591/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,225,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11592/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,225,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11593/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,225,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11594/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,226,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11595/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,226,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11596/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,226,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11597/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,226,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11598/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=2,226,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11599/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=2,227,008,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11600/500000]
+ optim/total_grad_norm=6.449
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,227,200,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11601/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,227,392,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11602/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,227,584,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11603/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,227,776,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11604/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,227,968,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11605/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=2,228,160,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11606/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,228,352,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11607/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,228,544,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11608/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,228,736,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11609/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=2,228,928,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11610/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,229,120,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11611/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,229,312,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11612/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,229,504,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11613/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,229,696,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11614/500000]
+ train/ActionL1Loss=0.0154
+ throughput/total_tokens=2,229,888,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11615/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,230,080,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11616/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,230,272,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11617/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=2,230,464,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11618/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,230,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11619/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,230,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11620/500000]
+ optim/total_grad_norm=8.907
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,231,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11621/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,231,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11622/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,231,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11623/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,231,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11624/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,231,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11625/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,232,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11626/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,232,192,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11627/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,232,384,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11628/500000]
+ train/ActionL1Loss=0.0154
+ throughput/total_tokens=2,232,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11629/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=2,232,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11630/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=2,232,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11631/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,233,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11632/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,233,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11633/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,233,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11634/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,233,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11635/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,233,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11636/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,234,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11637/500000]
+ train/ActionL1Loss=0.0147
+ throughput/total_tokens=2,234,304,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11638/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,234,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11639/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=2,234,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11640/500000]
+ optim/total_grad_norm=8.548
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,234,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11641/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,235,072,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11642/500000]
+ train/ActionL1Loss=0.0145
+ throughput/total_tokens=2,235,264,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11643/500000]
+ train/ActionL1Loss=0.0158
+ throughput/total_tokens=2,235,456,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11644/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,235,648,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11645/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,235,840,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11646/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=2,236,032,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11647/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=2,236,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11648/500000]
+ train/ActionL1Loss=0.0163
+ throughput/total_tokens=2,236,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11649/500000]
+ train/ActionL1Loss=0.0147
+ throughput/total_tokens=2,236,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11650/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,236,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11651/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,236,992,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11652/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,237,184,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11653/500000]
+ train/ActionL1Loss=0.0152
+ throughput/total_tokens=2,237,376,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11654/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,237,568,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11655/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,237,760,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11656/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=2,237,952,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11657/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=2,238,144,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11658/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,238,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11659/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,238,528,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=11660/500000]
+ optim/total_grad_norm=7.221
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,238,720,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=11661/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,238,912,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=11662/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,239,104,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=11663/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=2,239,296,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11664/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=2,239,488,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=11665/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,239,680,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11666/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,239,872,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11667/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=2,240,064,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11668/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,240,256,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11669/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,240,448,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11670/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,240,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11671/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,240,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11672/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,241,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11673/500000]
+ train/ActionL1Loss=0.0271
+ throughput/total_tokens=2,241,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11674/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,241,408,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11675/500000]
+ train/ActionL1Loss=0.0158
+ throughput/total_tokens=2,241,600,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11676/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,241,792,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11677/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,241,984,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11678/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,242,176,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11679/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,242,368,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11680/500000]
+ optim/total_grad_norm=8.471
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=2,242,560,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11681/500000]
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=2,242,752,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11682/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,242,944,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11683/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,243,136,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11684/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,243,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11685/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,243,520,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11686/500000]
+ train/ActionL1Loss=0.0163
+ throughput/total_tokens=2,243,712,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11687/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,243,904,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11688/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=2,244,096,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11689/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=2,244,288,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11690/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,244,480,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11691/500000]
+ train/ActionL1Loss=0.0137
+ throughput/total_tokens=2,244,672,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11692/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=2,244,864,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11693/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,245,056,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11694/500000]
+ train/ActionL1Loss=0.0282
+ throughput/total_tokens=2,245,248,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11695/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,245,440,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11696/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,245,632,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11697/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,245,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11698/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,246,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11699/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,246,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11700/500000]
+ optim/total_grad_norm=9.215
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,246,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11701/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,246,592,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11702/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,246,784,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11703/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,246,976,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11704/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,247,168,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11705/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=2,247,360,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11706/500000]
+ train/ActionL1Loss=0.0153
+ throughput/total_tokens=2,247,552,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11707/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=2,247,744,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11708/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,247,936,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11709/500000]
+ train/ActionL1Loss=0.0255
+ throughput/total_tokens=2,248,128,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11710/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,248,320,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=11711/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=2,248,512,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=11712/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=2,248,704,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11713/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,248,896,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11714/500000]
+ train/ActionL1Loss=0.0150
+ throughput/total_tokens=2,249,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11715/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=2,249,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11716/500000]
+ train/ActionL1Loss=0.0281
+ throughput/total_tokens=2,249,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11717/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,249,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11718/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,249,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11719/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,250,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11720/500000]
+ optim/total_grad_norm=8.683
+ train/ActionL1Loss=0.0239
+ throughput/total_tokens=2,250,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11721/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,250,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11722/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,250,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11723/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,250,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11724/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,251,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11725/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,251,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11726/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,251,392,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11727/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=2,251,584,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11728/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,251,776,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11729/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,251,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11730/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,252,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11731/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=2,252,352,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11732/500000]
+ train/ActionL1Loss=0.0298
+ throughput/total_tokens=2,252,544,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11733/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,252,736,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11734/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,252,928,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11735/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,253,120,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11736/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,253,312,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11737/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,253,504,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11738/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,253,696,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11739/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,253,888,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11740/500000]
+ optim/total_grad_norm=8.743
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=2,254,080,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11741/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=2,254,272,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11742/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,254,464,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11743/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,254,656,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11744/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,254,848,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11745/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,255,040,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11746/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,255,232,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11747/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,255,424,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11748/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=2,255,616,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11749/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,255,808,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11750/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,256,000,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11751/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,256,192,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=11752/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=2,256,384,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=11753/500000]
+ train/ActionL1Loss=0.0258
+ throughput/total_tokens=2,256,576,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=11754/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,256,768,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=11755/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,256,960,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=11756/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=2,257,152,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=11757/500000]
+ train/ActionL1Loss=0.0256
+ throughput/total_tokens=2,257,344,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=11758/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,257,536,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=11759/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,257,728,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=11760/500000]
+ optim/total_grad_norm=10.42
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,257,920,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=11761/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=2,258,112,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=11762/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,258,304,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=11763/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,258,496,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=11764/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=2,258,688,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=11765/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,258,880,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=11766/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,259,072,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=11767/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=2,259,264,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=11768/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=2,259,456,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=11769/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,259,648,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=11770/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,259,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11771/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,260,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11772/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=2,260,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11773/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,260,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11774/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,260,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11775/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,260,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11776/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,260,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11777/500000]
+ train/ActionL1Loss=0.0163
+ throughput/total_tokens=2,261,184,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11778/500000]
+ train/ActionL1Loss=0.0163
+ throughput/total_tokens=2,261,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11779/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,261,568,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11780/500000]
+ optim/total_grad_norm=6.720
+ train/ActionL1Loss=0.0153
+ throughput/total_tokens=2,261,760,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11781/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,261,952,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11782/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,262,144,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11783/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,262,336,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11784/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=2,262,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11785/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,262,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11786/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,262,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11787/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,263,104,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11788/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,263,296,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11789/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,263,488,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11790/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=2,263,680,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11791/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,263,872,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11792/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,264,064,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11793/500000]
+ train/ActionL1Loss=0.0150
+ throughput/total_tokens=2,264,256,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11794/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,264,448,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11795/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,264,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11796/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,264,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11797/500000]
+ train/ActionL1Loss=0.0150
+ throughput/total_tokens=2,265,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11798/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=2,265,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11799/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,265,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11800/500000]
+ optim/total_grad_norm=7.774
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,265,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11801/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,265,792,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11802/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,265,984,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11803/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,266,176,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11804/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,266,368,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11805/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,266,560,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11806/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,266,752,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11807/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,266,944,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11808/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,267,136,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11809/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,267,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11810/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,267,520,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11811/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,267,712,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11812/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=2,267,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11813/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,268,096,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11814/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,268,288,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11815/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,268,480,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11816/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,268,672,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11817/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,268,864,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11818/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=2,269,056,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11819/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,269,248,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11820/500000]
+ optim/total_grad_norm=7.566
+ train/ActionL1Loss=0.0250
+ throughput/total_tokens=2,269,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11821/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=2,269,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11822/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,269,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11823/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,270,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11824/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,270,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11825/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,270,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11826/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,270,592,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11827/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,270,784,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11828/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,270,976,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=11829/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=2,271,168,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11830/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,271,360,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11831/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,271,552,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11832/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,271,744,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11833/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,271,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11834/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,272,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11835/500000]
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,272,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11836/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=2,272,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11837/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,272,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11838/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,272,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11839/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,273,088,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11840/500000]
+ optim/total_grad_norm=9.474
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,273,280,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11841/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=2,273,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11842/500000]
+ train/ActionL1Loss=0.0296
+ throughput/total_tokens=2,273,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11843/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,273,856,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11844/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,274,048,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11845/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,274,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11846/500000]
+ train/ActionL1Loss=0.0148
+ throughput/total_tokens=2,274,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11847/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,274,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11848/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,274,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11849/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,275,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11850/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,275,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11851/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,275,392,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11852/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,275,584,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11853/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,275,776,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11854/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,275,968,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11855/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,276,160,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11856/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,276,352,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11857/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,276,544,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11858/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=2,276,736,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11859/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,276,928,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11860/500000]
+ optim/total_grad_norm=7.408
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,277,120,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=11861/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,277,312,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11862/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,277,504,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11863/500000]
+ train/ActionL1Loss=0.0140
+ throughput/total_tokens=2,277,696,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11864/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,277,888,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11865/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=2,278,080,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11866/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,278,272,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11867/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,278,464,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11868/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,278,656,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11869/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=2,278,848,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11870/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,279,040,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11871/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,279,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11872/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,279,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11873/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,279,616,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11874/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,279,808,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11875/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,280,000,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11876/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=2,280,192,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11877/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,280,384,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11878/500000]
+ train/ActionL1Loss=0.0152
+ throughput/total_tokens=2,280,576,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11879/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,280,768,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11880/500000]
+ optim/total_grad_norm=8.800
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,280,960,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11881/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,281,152,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11882/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,281,344,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11883/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,281,536,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11884/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,281,728,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11885/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,281,920,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11886/500000]
+ train/ActionL1Loss=0.0159
+ throughput/total_tokens=2,282,112,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11887/500000]
+ train/ActionL1Loss=0.0150
+ throughput/total_tokens=2,282,304,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11888/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,282,496,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11889/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,282,688,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11890/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=2,282,880,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11891/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=2,283,072,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11892/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,283,264,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11893/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,283,456,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11894/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,283,648,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11895/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,283,840,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11896/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,284,032,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11897/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,284,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11898/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,284,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11899/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,284,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=11900/500000]
+ optim/total_grad_norm=8.503
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,284,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=11901/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,284,992,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11902/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,285,184,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11903/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,285,376,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11904/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,285,568,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11905/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,285,760,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11906/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,285,952,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11907/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,286,144,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11908/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,286,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11909/500000]
+ train/ActionL1Loss=0.0145
+ throughput/total_tokens=2,286,528,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11910/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,286,720,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=11911/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,286,912,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11912/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,287,104,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=11913/500000]
+ train/ActionL1Loss=0.0155
+ throughput/total_tokens=2,287,296,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11914/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,287,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11915/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,287,680,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11916/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,287,872,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11917/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,288,064,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11918/500000]
+ train/ActionL1Loss=0.0155
+ throughput/total_tokens=2,288,256,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11919/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,288,448,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=11920/500000]
+ optim/total_grad_norm=8.456
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,288,640,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11921/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,288,832,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11922/500000]
+ train/ActionL1Loss=0.0160
+ throughput/total_tokens=2,289,024,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11923/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,289,216,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11924/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,289,408,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11925/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,289,600,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11926/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,289,792,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11927/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,289,984,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11928/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,290,176,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11929/500000]
+ train/ActionL1Loss=0.0128
+ throughput/total_tokens=2,290,368,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11930/500000]
+ train/ActionL1Loss=0.0152
+ throughput/total_tokens=2,290,560,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11931/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,290,752,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11932/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=2,290,944,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11933/500000]
+ train/ActionL1Loss=0.0150
+ throughput/total_tokens=2,291,136,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11934/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,291,328,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11935/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,291,520,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11936/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,291,712,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11937/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,291,904,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11938/500000]
+ train/ActionL1Loss=0.0144
+ throughput/total_tokens=2,292,096,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11939/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,292,288,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11940/500000]
+ optim/total_grad_norm=8.732
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,292,480,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11941/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,292,672,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11942/500000]
+ train/ActionL1Loss=0.0154
+ throughput/total_tokens=2,292,864,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=11943/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,293,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11944/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,293,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11945/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,293,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11946/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,293,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11947/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,293,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11948/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,294,016,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11949/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,294,208,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11950/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,294,400,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11951/500000]
+ train/ActionL1Loss=0.0150
+ throughput/total_tokens=2,294,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11952/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,294,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11953/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,294,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11954/500000]
+ train/ActionL1Loss=0.0151
+ throughput/total_tokens=2,295,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11955/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,295,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11956/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,295,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11957/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,295,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11958/500000]
+ train/ActionL1Loss=0.0136
+ throughput/total_tokens=2,295,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11959/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,296,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11960/500000]
+ optim/total_grad_norm=8.854
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,296,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=11961/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,296,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11962/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,296,704,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11963/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,296,896,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11964/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,297,088,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11965/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,297,280,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11966/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,297,472,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=11967/500000]
+ train/ActionL1Loss=0.0134
+ throughput/total_tokens=2,297,664,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11968/500000]
+ train/ActionL1Loss=0.0140
+ throughput/total_tokens=2,297,856,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11969/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,298,048,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=11970/500000]
+ train/ActionL1Loss=0.0145
+ throughput/total_tokens=2,298,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11971/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,298,432,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11972/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,298,624,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11973/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=2,298,816,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11974/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,299,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11975/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,299,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11976/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,299,392,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11977/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=2,299,584,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11978/500000]
+ train/ActionL1Loss=0.0160
+ throughput/total_tokens=2,299,776,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11979/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,299,968,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11980/500000]
+ optim/total_grad_norm=7.972
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,300,160,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11981/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,300,352,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11982/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,300,544,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11983/500000]
+ train/ActionL1Loss=0.0158
+ throughput/total_tokens=2,300,736,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11984/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,300,928,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11985/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,301,120,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11986/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,301,312,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11987/500000]
+ train/ActionL1Loss=0.0155
+ throughput/total_tokens=2,301,504,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11988/500000]
+ train/ActionL1Loss=0.0151
+ throughput/total_tokens=2,301,696,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11989/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=2,301,888,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11990/500000]
+ train/ActionL1Loss=0.0280
+ throughput/total_tokens=2,302,080,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=11991/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=2,302,272,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11992/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,302,464,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11993/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,302,656,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11994/500000]
+ train/ActionL1Loss=0.0143
+ throughput/total_tokens=2,302,848,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11995/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,303,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11996/500000]
+ train/ActionL1Loss=0.0264
+ throughput/total_tokens=2,303,232,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11997/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,303,424,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11998/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,303,616,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=11999/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,303,808,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12000/500000]
+ optim/total_grad_norm=7.862
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,304,000,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+10/05 [14:01:11] INFO | >> Saving config... checkpoint.py:608
+10/05 [14:02:02] INFO | >> Saving model state... checkpoint.py:796
+10/05 [14:03:14] INFO | >> Saving optim state... checkpoint.py:811
+10/05 [14:04:45] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=12001/500000]
+ train/ActionL1Loss=0.0247
+ throughput/total_tokens=2,304,192,000
+ throughput/device/tokens_per_second=1,220
+ throughput/device/batches_per_second=0.0509
+[step=12002/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=2,304,384,000
+ throughput/device/tokens_per_second=1,201
+ throughput/device/batches_per_second=0.0501
+[step=12003/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,304,576,000
+ throughput/device/tokens_per_second=1,195
+ throughput/device/batches_per_second=0.0498
+[step=12004/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,304,768,000
+ throughput/device/tokens_per_second=1,192
+ throughput/device/batches_per_second=0.0497
+[step=12005/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,304,960,000
+ throughput/device/tokens_per_second=1,190
+ throughput/device/batches_per_second=0.0496
+[step=12006/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=2,305,152,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=12007/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=2,305,344,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0496
+[step=12008/500000]
+ train/ActionL1Loss=0.0163
+ throughput/total_tokens=2,305,536,000
+ throughput/device/tokens_per_second=1,189
+ throughput/device/batches_per_second=0.0495
+[step=12009/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=2,305,728,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=12010/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,305,920,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12011/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,306,112,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=12012/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=2,306,304,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=12013/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,306,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12014/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,306,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12015/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,306,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12016/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=2,307,072,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12017/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=2,307,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12018/500000]
+ train/ActionL1Loss=0.0252
+ throughput/total_tokens=2,307,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12019/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,307,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12020/500000]
+ optim/total_grad_norm=7.922
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,307,840,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=12021/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,308,032,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12022/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,308,224,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12023/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,308,416,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12024/500000]
+ train/ActionL1Loss=0.0148
+ throughput/total_tokens=2,308,608,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12025/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,308,800,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12026/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,308,992,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12027/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,309,184,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12028/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=2,309,376,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12029/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,309,568,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12030/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,309,760,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12031/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,309,952,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12032/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,310,144,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12033/500000]
+ train/ActionL1Loss=0.0158
+ throughput/total_tokens=2,310,336,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12034/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,310,528,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12035/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,310,720,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12036/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,310,912,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12037/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,311,104,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12038/500000]
+ train/ActionL1Loss=0.0155
+ throughput/total_tokens=2,311,296,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12039/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,311,488,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12040/500000]
+ optim/total_grad_norm=7.809
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,311,680,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12041/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,311,872,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12042/500000]
+ train/ActionL1Loss=0.0156
+ throughput/total_tokens=2,312,064,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12043/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,312,256,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12044/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,312,448,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12045/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,312,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12046/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,312,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12047/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,313,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12048/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,313,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12049/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,313,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12050/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=2,313,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12051/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,313,792,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12052/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,313,984,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12053/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=2,314,176,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12054/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,314,368,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12055/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,314,560,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12056/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,314,752,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12057/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,314,944,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12058/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,315,136,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12059/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,315,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12060/500000]
+ optim/total_grad_norm=8.597
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,315,520,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=12061/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=2,315,712,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12062/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=2,315,904,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12063/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,316,096,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12064/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,316,288,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12065/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,316,480,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12066/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=2,316,672,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12067/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,316,864,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12068/500000]
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=2,317,056,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12069/500000]
+ train/ActionL1Loss=0.0151
+ throughput/total_tokens=2,317,248,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12070/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,317,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=12071/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,317,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12072/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,317,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12073/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,318,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12074/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,318,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12075/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,318,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12076/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=2,318,592,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12077/500000]
+ train/ActionL1Loss=0.0163
+ throughput/total_tokens=2,318,784,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12078/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,318,976,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12079/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=2,319,168,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12080/500000]
+ optim/total_grad_norm=9.039
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,319,360,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=12081/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,319,552,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12082/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,319,744,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12083/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=2,319,936,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12084/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,320,128,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12085/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,320,320,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12086/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,320,512,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12087/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,320,704,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12088/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,320,896,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12089/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,321,088,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12090/500000]
+ train/ActionL1Loss=0.0210
+ throughput/total_tokens=2,321,280,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12091/500000]
+ train/ActionL1Loss=0.0159
+ throughput/total_tokens=2,321,472,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12092/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,321,664,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12093/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,321,856,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12094/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,322,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12095/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,322,240,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12096/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,322,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12097/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=2,322,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12098/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=2,322,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12099/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,323,008,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12100/500000]
+ optim/total_grad_norm=8.390
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,323,200,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12101/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,323,392,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=12102/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=2,323,584,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=12103/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,323,776,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=12104/500000]
+ train/ActionL1Loss=0.0234
+ throughput/total_tokens=2,323,968,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=12105/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,324,160,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=12106/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,324,352,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=12107/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,324,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=12108/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=2,324,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=12109/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,324,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=12110/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,325,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=46,917
+[step=12111/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,325,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=12112/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,325,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=12113/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,325,696,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=12114/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,325,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=12115/500000]
+ train/ActionL1Loss=0.0158
+ throughput/total_tokens=2,326,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=12116/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,326,272,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=12117/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,326,464,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=12118/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,326,656,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=12119/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=2,326,848,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=12120/500000]
+ optim/total_grad_norm=9.437
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,327,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12121/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,327,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12122/500000]
+ train/ActionL1Loss=0.0160
+ throughput/total_tokens=2,327,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12123/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=2,327,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12124/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,327,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12125/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,328,000,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12126/500000]
+ train/ActionL1Loss=0.0151
+ throughput/total_tokens=2,328,192,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12127/500000]
+ train/ActionL1Loss=0.0262
+ throughput/total_tokens=2,328,384,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12128/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,328,576,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12129/500000]
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,328,768,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12130/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,328,960,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=12131/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,329,152,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12132/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,329,344,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12133/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=2,329,536,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12134/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=2,329,728,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12135/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,329,920,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12136/500000]
+ train/ActionL1Loss=0.0265
+ throughput/total_tokens=2,330,112,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12137/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,330,304,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12138/500000]
+ train/ActionL1Loss=0.0241
+ throughput/total_tokens=2,330,496,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12139/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=2,330,688,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12140/500000]
+ optim/total_grad_norm=8.131
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,330,880,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=12141/500000]
+ train/ActionL1Loss=0.0260
+ throughput/total_tokens=2,331,072,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12142/500000]
+ train/ActionL1Loss=0.0261
+ throughput/total_tokens=2,331,264,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12143/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,331,456,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12144/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=2,331,648,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12145/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,331,840,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12146/500000]
+ train/ActionL1Loss=0.0158
+ throughput/total_tokens=2,332,032,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12147/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=2,332,224,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12148/500000]
+ train/ActionL1Loss=0.0173
+ throughput/total_tokens=2,332,416,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12149/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,332,608,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12150/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=2,332,800,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=12151/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,332,992,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12152/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,333,184,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12153/500000]
+ train/ActionL1Loss=0.0259
+ throughput/total_tokens=2,333,376,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12154/500000]
+ train/ActionL1Loss=0.0215
+ throughput/total_tokens=2,333,568,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12155/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,333,760,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12156/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,333,952,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12157/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=2,334,144,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12158/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,334,336,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12159/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,334,528,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12160/500000]
+ optim/total_grad_norm=7.838
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,334,720,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=12161/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=2,334,912,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12162/500000]
+ train/ActionL1Loss=0.0240
+ throughput/total_tokens=2,335,104,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12163/500000]
+ train/ActionL1Loss=0.0163
+ throughput/total_tokens=2,335,296,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12164/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,335,488,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12165/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,335,680,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12166/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,335,872,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=12167/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=2,336,064,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=12168/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,336,256,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=12169/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,336,448,000
+ throughput/device/tokens_per_second=1,181
+ throughput/device/batches_per_second=0.0492
+[step=12170/500000]
+ train/ActionL1Loss=0.0156
+ throughput/total_tokens=2,336,640,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=12171/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,336,832,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12172/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,337,024,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12173/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,337,216,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12174/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,337,408,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12175/500000]
+ train/ActionL1Loss=0.0245
+ throughput/total_tokens=2,337,600,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12176/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,337,792,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12177/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=2,337,984,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12178/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,338,176,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12179/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,338,368,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12180/500000]
+ optim/total_grad_norm=8.048
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=2,338,560,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=12181/500000]
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=2,338,752,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12182/500000]
+ train/ActionL1Loss=0.0220
+ throughput/total_tokens=2,338,944,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12183/500000]
+ train/ActionL1Loss=0.0145
+ throughput/total_tokens=2,339,136,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12184/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,339,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12185/500000]
+ train/ActionL1Loss=0.0254
+ throughput/total_tokens=2,339,520,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12186/500000]
+ train/ActionL1Loss=0.0147
+ throughput/total_tokens=2,339,712,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12187/500000]
+ train/ActionL1Loss=0.0138
+ throughput/total_tokens=2,339,904,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12188/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,340,096,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12189/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,340,288,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12190/500000]
+ train/ActionL1Loss=0.0151
+ throughput/total_tokens=2,340,480,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=12191/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,340,672,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12192/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,340,864,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12193/500000]
+ train/ActionL1Loss=0.0151
+ throughput/total_tokens=2,341,056,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12194/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=2,341,248,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12195/500000]
+ train/ActionL1Loss=0.0154
+ throughput/total_tokens=2,341,440,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12196/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,341,632,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12197/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=2,341,824,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12198/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,342,016,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12199/500000]
+ train/ActionL1Loss=0.0145
+ throughput/total_tokens=2,342,208,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12200/500000]
+ optim/total_grad_norm=9.837
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,342,400,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12201/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,342,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12202/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,342,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12203/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,342,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12204/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,343,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12205/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,343,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12206/500000]
+ train/ActionL1Loss=0.0160
+ throughput/total_tokens=2,343,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12207/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,343,744,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12208/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,343,936,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12209/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=2,344,128,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12210/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,344,320,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=12211/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,344,512,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12212/500000]
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,344,704,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12213/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,344,896,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12214/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,345,088,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12215/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,345,280,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12216/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,345,472,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12217/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,345,664,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12218/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,345,856,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12219/500000]
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=2,346,048,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12220/500000]
+ optim/total_grad_norm=9.501
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,346,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=12221/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,346,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12222/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,346,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12223/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,346,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12224/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,347,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12225/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,347,200,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12226/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,347,392,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12227/500000]
+ train/ActionL1Loss=0.0162
+ throughput/total_tokens=2,347,584,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12228/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,347,776,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12229/500000]
+ train/ActionL1Loss=0.0230
+ throughput/total_tokens=2,347,968,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12230/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,348,160,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=12231/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,348,352,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12232/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,348,544,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12233/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,348,736,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12234/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,348,928,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12235/500000]
+ train/ActionL1Loss=0.0158
+ throughput/total_tokens=2,349,120,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12236/500000]
+ train/ActionL1Loss=0.0216
+ throughput/total_tokens=2,349,312,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12237/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,349,504,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12238/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,349,696,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12239/500000]
+ train/ActionL1Loss=0.0212
+ throughput/total_tokens=2,349,888,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12240/500000]
+ optim/total_grad_norm=7.000
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,350,080,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=12241/500000]
+ train/ActionL1Loss=0.0138
+ throughput/total_tokens=2,350,272,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12242/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=2,350,464,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12243/500000]
+ train/ActionL1Loss=0.0181
+ throughput/total_tokens=2,350,656,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12244/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,350,848,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12245/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=2,351,040,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12246/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,351,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12247/500000]
+ train/ActionL1Loss=0.0223
+ throughput/total_tokens=2,351,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12248/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,351,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12249/500000]
+ train/ActionL1Loss=0.0203
+ throughput/total_tokens=2,351,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12250/500000]
+ train/ActionL1Loss=0.0144
+ throughput/total_tokens=2,352,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=12251/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,352,192,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12252/500000]
+ train/ActionL1Loss=0.0165
+ throughput/total_tokens=2,352,384,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12253/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,352,576,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12254/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,352,768,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12255/500000]
+ train/ActionL1Loss=0.0221
+ throughput/total_tokens=2,352,960,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12256/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,353,152,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12257/500000]
+ train/ActionL1Loss=0.0200
+ throughput/total_tokens=2,353,344,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12258/500000]
+ train/ActionL1Loss=0.0272
+ throughput/total_tokens=2,353,536,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12259/500000]
+ train/ActionL1Loss=0.0233
+ throughput/total_tokens=2,353,728,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12260/500000]
+ optim/total_grad_norm=8.996
+ train/ActionL1Loss=0.0217
+ throughput/total_tokens=2,353,920,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=12261/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,354,112,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12262/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,354,304,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12263/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,354,496,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12264/500000]
+ train/ActionL1Loss=0.0232
+ throughput/total_tokens=2,354,688,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12265/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,354,880,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12266/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=2,355,072,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12267/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,355,264,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12268/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,355,456,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12269/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=2,355,648,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12270/500000]
+ train/ActionL1Loss=0.0270
+ throughput/total_tokens=2,355,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12271/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=2,356,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12272/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,356,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12273/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,356,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12274/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=2,356,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12275/500000]
+ train/ActionL1Loss=0.0188
+ throughput/total_tokens=2,356,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12276/500000]
+ train/ActionL1Loss=0.0208
+ throughput/total_tokens=2,356,992,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12277/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,357,184,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12278/500000]
+ train/ActionL1Loss=0.0238
+ throughput/total_tokens=2,357,376,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12279/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,357,568,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12280/500000]
+ optim/total_grad_norm=7.938
+ train/ActionL1Loss=0.0231
+ throughput/total_tokens=2,357,760,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12281/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,357,952,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12282/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,358,144,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12283/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=2,358,336,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12284/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,358,528,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12285/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=2,358,720,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12286/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=2,358,912,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12287/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,359,104,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12288/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,359,296,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12289/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,359,488,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12290/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,359,680,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=12291/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,359,872,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12292/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,360,064,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12293/500000]
+ train/ActionL1Loss=0.0236
+ throughput/total_tokens=2,360,256,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12294/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,360,448,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12295/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,360,640,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12296/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,360,832,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12297/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,361,024,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12298/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,361,216,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12299/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=2,361,408,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12300/500000]
+ optim/total_grad_norm=9.323
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,361,600,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12301/500000]
+ train/ActionL1Loss=0.0197
+ throughput/total_tokens=2,361,792,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12302/500000]
+ train/ActionL1Loss=0.0152
+ throughput/total_tokens=2,361,984,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12303/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,362,176,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12304/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,362,368,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12305/500000]
+ train/ActionL1Loss=0.0222
+ throughput/total_tokens=2,362,560,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12306/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,362,752,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12307/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,362,944,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12308/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,363,136,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12309/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,363,328,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12310/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,363,520,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=12311/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,363,712,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12312/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,363,904,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12313/500000]
+ train/ActionL1Loss=0.0227
+ throughput/total_tokens=2,364,096,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12314/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,364,288,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12315/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,364,480,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12316/500000]
+ train/ActionL1Loss=0.0163
+ throughput/total_tokens=2,364,672,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12317/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,364,864,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12318/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,365,056,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12319/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,365,248,000
+ throughput/device/tokens_per_second=1,182
+ throughput/device/batches_per_second=0.0493
+[step=12320/500000]
+ optim/total_grad_norm=7.445
+ train/ActionL1Loss=0.0180
+ throughput/total_tokens=2,365,440,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=12321/500000]
+ train/ActionL1Loss=0.0159
+ throughput/total_tokens=2,365,632,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12322/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,365,824,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12323/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,366,016,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12324/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,366,208,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12325/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,366,400,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12326/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,366,592,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12327/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,366,784,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12328/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,366,976,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12329/500000]
+ train/ActionL1Loss=0.0167
+ throughput/total_tokens=2,367,168,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12330/500000]
+ train/ActionL1Loss=0.0147
+ throughput/total_tokens=2,367,360,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=12331/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,367,552,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12332/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,367,744,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12333/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,367,936,000
+ throughput/device/tokens_per_second=1,185
+ throughput/device/batches_per_second=0.0494
+[step=12334/500000]
+ train/ActionL1Loss=0.0205
+ throughput/total_tokens=2,368,128,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12335/500000]
+ train/ActionL1Loss=0.0182
+ throughput/total_tokens=2,368,320,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12336/500000]
+ train/ActionL1Loss=0.0166
+ throughput/total_tokens=2,368,512,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12337/500000]
+ train/ActionL1Loss=0.0145
+ throughput/total_tokens=2,368,704,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12338/500000]
+ train/ActionL1Loss=0.0159
+ throughput/total_tokens=2,368,896,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12339/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,369,088,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12340/500000]
+ optim/total_grad_norm=7.104
+ train/ActionL1Loss=0.0168
+ throughput/total_tokens=2,369,280,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=12341/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,369,472,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12342/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,369,664,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12343/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,369,856,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12344/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,370,048,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12345/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,370,240,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12346/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,370,432,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12347/500000]
+ train/ActionL1Loss=0.0189
+ throughput/total_tokens=2,370,624,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12348/500000]
+ train/ActionL1Loss=0.0193
+ throughput/total_tokens=2,370,816,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12349/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,371,008,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12350/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,371,200,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+ System/Peak GPU Memory (MB)=46,917
+[step=12351/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,371,392,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12352/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,371,584,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12353/500000]
+ train/ActionL1Loss=0.0253
+ throughput/total_tokens=2,371,776,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12354/500000]
+ train/ActionL1Loss=0.0284
+ throughput/total_tokens=2,371,968,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12355/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,372,160,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12356/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,372,352,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0494
+[step=12357/500000]
+ train/ActionL1Loss=0.0158
+ throughput/total_tokens=2,372,544,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12358/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,372,736,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12359/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,372,928,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12360/500000]
+ optim/total_grad_norm=7.981
+ train/ActionL1Loss=0.0179
+ throughput/total_tokens=2,373,120,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=12361/500000]
+ train/ActionL1Loss=0.0214
+ throughput/total_tokens=2,373,312,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12362/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,373,504,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12363/500000]
+ train/ActionL1Loss=0.0136
+ throughput/total_tokens=2,373,696,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12364/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,373,888,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12365/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,374,080,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12366/500000]
+ train/ActionL1Loss=0.0175
+ throughput/total_tokens=2,374,272,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12367/500000]
+ train/ActionL1Loss=0.0161
+ throughput/total_tokens=2,374,464,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12368/500000]
+ train/ActionL1Loss=0.0243
+ throughput/total_tokens=2,374,656,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12369/500000]
+ train/ActionL1Loss=0.0151
+ throughput/total_tokens=2,374,848,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12370/500000]
+ train/ActionL1Loss=0.0172
+ throughput/total_tokens=2,375,040,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12371/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,375,232,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12372/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,375,424,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12373/500000]
+ train/ActionL1Loss=0.0237
+ throughput/total_tokens=2,375,616,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12374/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,375,808,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12375/500000]
+ train/ActionL1Loss=0.0219
+ throughput/total_tokens=2,376,000,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12376/500000]
+ train/ActionL1Loss=0.0185
+ throughput/total_tokens=2,376,192,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0494
+[step=12377/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,376,384,000
+ throughput/device/tokens_per_second=1,186
+ throughput/device/batches_per_second=0.0495
+[step=12378/500000]
+ train/ActionL1Loss=0.0170
+ throughput/total_tokens=2,376,576,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12379/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,376,768,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12380/500000]
+ optim/total_grad_norm=6.220
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=2,376,960,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12381/500000]
+ train/ActionL1Loss=0.0145
+ throughput/total_tokens=2,377,152,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12382/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,377,344,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12383/500000]
+ train/ActionL1Loss=0.0192
+ throughput/total_tokens=2,377,536,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12384/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,377,728,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12385/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,377,920,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12386/500000]
+ train/ActionL1Loss=0.0155
+ throughput/total_tokens=2,378,112,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12387/500000]
+ train/ActionL1Loss=0.0235
+ throughput/total_tokens=2,378,304,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12388/500000]
+ train/ActionL1Loss=0.0157
+ throughput/total_tokens=2,378,496,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12389/500000]
+ train/ActionL1Loss=0.0156
+ throughput/total_tokens=2,378,688,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12390/500000]
+ train/ActionL1Loss=0.0213
+ throughput/total_tokens=2,378,880,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12391/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,379,072,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=12392/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,379,264,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12393/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,379,456,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12394/500000]
+ train/ActionL1Loss=0.0154
+ throughput/total_tokens=2,379,648,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12395/500000]
+ train/ActionL1Loss=0.0204
+ throughput/total_tokens=2,379,840,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12396/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=2,380,032,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12397/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,380,224,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12398/500000]
+ train/ActionL1Loss=0.0228
+ throughput/total_tokens=2,380,416,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12399/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,380,608,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12400/500000]
+ optim/total_grad_norm=7.581
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,380,800,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12401/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,380,992,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12402/500000]
+ train/ActionL1Loss=0.0151
+ throughput/total_tokens=2,381,184,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12403/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,381,376,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12404/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,381,568,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12405/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,381,760,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12406/500000]
+ train/ActionL1Loss=0.0194
+ throughput/total_tokens=2,381,952,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12407/500000]
+ train/ActionL1Loss=0.0191
+ throughput/total_tokens=2,382,144,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12408/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,382,336,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12409/500000]
+ train/ActionL1Loss=0.0174
+ throughput/total_tokens=2,382,528,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12410/500000]
+ train/ActionL1Loss=0.0154
+ throughput/total_tokens=2,382,720,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+ System/Peak GPU Memory (MB)=46,917
+[step=12411/500000]
+ train/ActionL1Loss=0.0187
+ throughput/total_tokens=2,382,912,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12412/500000]
+ train/ActionL1Loss=0.0195
+ throughput/total_tokens=2,383,104,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12413/500000]
+ train/ActionL1Loss=0.0186
+ throughput/total_tokens=2,383,296,000
+ throughput/device/tokens_per_second=1,183
+ throughput/device/batches_per_second=0.0493
+[step=12414/500000]
+ train/ActionL1Loss=0.0153
+ throughput/total_tokens=2,383,488,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12415/500000]
+ train/ActionL1Loss=0.0190
+ throughput/total_tokens=2,383,680,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12416/500000]
+ train/ActionL1Loss=0.0176
+ throughput/total_tokens=2,383,872,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12417/500000]
+ train/ActionL1Loss=0.0169
+ throughput/total_tokens=2,384,064,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12418/500000]
+ train/ActionL1Loss=0.0152
+ throughput/total_tokens=2,384,256,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12419/500000]
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,384,448,000
+ throughput/device/tokens_per_second=1,184
+ throughput/device/batches_per_second=0.0493
+[step=12420/500000]
+ optim/total_grad_norm=8.997
+ train/ActionL1Loss=0.0198
+ throughput/total_tokens=2,384,640,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12421/500000]
+ train/ActionL1Loss=0.0225
+ throughput/total_tokens=2,384,832,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12422/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,385,024,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12423/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,385,216,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12424/500000]
+ train/ActionL1Loss=0.0199
+ throughput/total_tokens=2,385,408,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12425/500000]
+ train/ActionL1Loss=0.0177
+ throughput/total_tokens=2,385,600,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12426/500000]
+ train/ActionL1Loss=0.0224
+ throughput/total_tokens=2,385,792,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12427/500000]
+ train/ActionL1Loss=0.0206
+ throughput/total_tokens=2,385,984,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12428/500000]
+ train/ActionL1Loss=0.0226
+ throughput/total_tokens=2,386,176,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12429/500000]
+ train/ActionL1Loss=0.0211
+ throughput/total_tokens=2,386,368,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12430/500000]
+ train/ActionL1Loss=0.0171
+ throughput/total_tokens=2,386,560,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12431/500000]
+ train/ActionL1Loss=0.0201
+ throughput/total_tokens=2,386,752,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12432/500000]
+ train/ActionL1Loss=0.0244
+ throughput/total_tokens=2,386,944,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12433/500000]
+ train/ActionL1Loss=0.0207
+ throughput/total_tokens=2,387,136,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12434/500000]
+ train/ActionL1Loss=0.0178
+ throughput/total_tokens=2,387,328,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12435/500000]
+ train/ActionL1Loss=0.0209
+ throughput/total_tokens=2,387,520,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12436/500000]
+ train/ActionL1Loss=0.0218
+ throughput/total_tokens=2,387,712,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12437/500000]
+ train/ActionL1Loss=0.0140
+ throughput/total_tokens=2,387,904,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12438/500000]
+ train/ActionL1Loss=0.0152
+ throughput/total_tokens=2,388,096,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+[step=12439/500000]
+ train/ActionL1Loss=0.0196
+ throughput/total_tokens=2,388,288,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12440/500000]
+ optim/total_grad_norm=7.228
+ train/ActionL1Loss=0.0229
+ throughput/total_tokens=2,388,480,000
+ throughput/device/tokens_per_second=1,188
+ throughput/device/batches_per_second=0.0495
+ System/Peak GPU Memory (MB)=46,917
+[step=12441/500000]
+ train/ActionL1Loss=0.0164
+ throughput/total_tokens=2,388,672,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12442/500000]
+ train/ActionL1Loss=0.0143
+ throughput/total_tokens=2,388,864,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12443/500000]
+ train/ActionL1Loss=0.0183
+ throughput/total_tokens=2,389,056,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12444/500000]
+ train/ActionL1Loss=0.0159
+ throughput/total_tokens=2,389,248,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12445/500000]
+ train/ActionL1Loss=0.0143
+ throughput/total_tokens=2,389,440,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12446/500000]
+ train/ActionL1Loss=0.0202
+ throughput/total_tokens=2,389,632,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
+[step=12447/500000]
+ train/ActionL1Loss=0.0184
+ throughput/total_tokens=2,389,824,000
+ throughput/device/tokens_per_second=1,187
+ throughput/device/batches_per_second=0.0495
diff --git a/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/files/requirements.txt b/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/files/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..5a5e971a5d9f3b6f6a75248e203682c5fbcd69e8
--- /dev/null
+++ b/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/files/requirements.txt
@@ -0,0 +1,286 @@
+ai2-molmo==0.0.0
+astunparse==1.6.3
+flatbuffers==25.2.10
+gast==0.6.0
+google-pasta==0.2.0
+h5py==3.14.0
+libclang==18.1.1
+Markdown==3.9
+namex==0.1.0
+opt_einsum==3.4.0
+optree==0.17.0
+tensorboard-data-server==0.7.2
+tensorflow-io-gcs-filesystem==0.37.1
+termcolor==3.1.0
+Werkzeug==3.1.3
+Brotli==1.1.0
+Farama-Notifications==0.0.4
+MarkupSafe==2.1.5
+PyYAML==6.0.2
+absl-py==2.3.1
+accelerate==1.10.1
+ai2-molmo==0.0.0
+aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.15
+aiosignal==1.4.0
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+anyio==4.10.0
+array_record==0.8.1
+async-timeout==5.0.1
+attrs==25.3.0
+av==15.1.0
+backports.tarfile==1.2.0
+beaker-gantry==3.2.0
+beaker-py==2.5.0
+black==23.12.1
+blinker==1.9.0
+boltons==25.0.0
+boto3==1.40.33
+botocore==1.40.33
+build==1.3.0
+cached_path==1.7.3
+cached-property==2.0.1
+cachetools==5.5.2
+certifi==2025.8.3
+cffi==2.0.0
+charset-normalizer==3.4.3
+click==8.2.1
+click-help-colors==0.9.4
+click-option-group==0.5.7
+cloudpickle==3.1.1
+cmake==4.1.0
+contourpy==1.3.2
+cryptography==46.0.1
+cycler==0.12.1
+dataclass-extensions==0.2.3
+datasets==3.6.0
+decorator==5.2.1
+deepdiff==8.6.1
+diffusers==0.35.1
+dill==0.3.8
+distro==1.9.0
+dlimp==0.0.1
+dm-tree==0.1.9
+docutils==0.22.1
+draccus==0.10.0
+editdistance==0.8.1
+einops==0.8.1
+einops-exts==0.0.4
+et_xmlfile==2.0.0
+etils==1.13.0
+evdev==1.9.2
+exceptiongroup==1.3.0
+face==24.0.0
+fastapi==0.116.2
+ffmpy==0.6.1
+fiddle==0.3.0
+filelock==3.13.1
+Flask==3.1.2
+fonttools==4.60.0
+frozenlist==1.7.0
+fsspec==2023.9.2
+ftfy==6.3.1
+gcsfs==2023.9.2
+gitdb==4.0.12
+GitPython==3.1.45
+glom==24.11.0
+google-api-core==2.25.1
+google-auth==2.40.3
+google-auth-oauthlib==1.2.2
+google-cloud-core==2.4.3
+google-cloud-storage==2.19.0
+google-crc32c==1.7.1
+google-resumable-media==2.7.2
+googleapis-common-protos==1.70.0
+gradio==5.46.0
+gradio_client==1.13.0
+graphviz==0.21
+groovy==0.1.2
+grpcio==1.75.0
+gymnasium==0.29.1
+h11==0.16.0
+hf_transfer==0.1.9
+hf-xet==1.1.10
+httpcore==1.0.9
+httpx==0.28.1
+huggingface-hub==0.35.0
+id==1.5.0
+idna==3.10
+imageio==2.37.0
+imageio-ffmpeg==0.6.0
+importlib_metadata==8.7.0
+importlib_resources==6.5.2
+iniconfig==2.1.0
+inquirerpy==0.3.4
+isort==5.12.0
+itsdangerous==2.2.0
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.3.0
+jeepney==0.9.0
+Jinja2==3.1.4
+jiter==0.11.0
+jmespath==1.0.1
+joblib==1.5.2
+jsonlines==4.0.0
+keras==2.15.0
+keyring==25.6.0
+kiwisolver==1.4.9
+latex2sympy2_extended==1.10.2
+lerobot==0.3.4
+Levenshtein==0.27.1
+libcst==1.8.4
+lightning-utilities==0.15.2
+markdown-it-py==4.0.0
+math-verify==0.8.0
+matplotlib==3.10.6
+mdurl==0.1.2
+mergedeep==1.3.4
+ml-dtypes==0.2.0
+ml_dtypes==0.5.3
+more-itertools==10.8.0
+mpmath==1.3.0
+msgspec==0.19.0
+multidict==6.6.4
+multiprocess==0.70.16
+mypy==1.3.0
+mypy_extensions==1.1.0
+necessary==0.4.3
+networkx==3.3
+nh3==0.3.0
+nltk==3.9.1
+numpy==1.26.4
+oauthlib==3.3.1
+omegaconf==2.3.0
+openai==1.108.0
+opencv-python-headless==4.12.0.88
+OpenEXR==3.4.0
+openpyxl==3.1.5
+orderly-set==5.5.0
+orjson==3.11.3
+packaging==25.0
+pandas==2.3.2
+pathspec==0.12.1
+petname==2.6
+pfzy==0.3.4
+pillow==11.0.0
+pip==25.2
+platformdirs==4.4.0
+pluggy==1.6.0
+promise==2.3
+prompt_toolkit==3.0.52
+propcache==0.3.2
+proto-plus==1.26.1
+protobuf==4.21.12
+protobuf==6.32.1
+psutil==7.1.0
+pyarrow==21.0.0
+pyasn1==0.6.1
+pyasn1_modules==0.4.2
+pycparser==2.23
+pydantic==2.11.9
+pydantic_core==2.33.2
+pydub==0.25.1
+Pygments==2.19.2
+pynput==1.8.1
+pyparsing==3.2.4
+pyproject_hooks==1.2.0
+pyserial==3.5
+pytest==8.4.2
+pytest-sphinx==0.6.3
+python-dateutil==2.9.0.post0
+python-Levenshtein==0.27.1
+python-multipart==0.0.20
+python-xlib==0.33
+pytorch-triton-rocm==3.4.0
+pytz==2025.2
+pyyaml-include==1.4.1
+RapidFuzz==3.14.1
+readme_renderer==44.0
+regex==2025.9.1
+requests==2.32.5
+requests-oauthlib==2.0.0
+requests-toolbelt==1.0.0
+requirements-parser==0.13.0
+rerun-sdk==0.22.1
+rfc3986==2.0.0
+rich==13.9.4
+rsa==4.9.1
+ruff==0.13.0
+s3transfer==0.14.0
+safehttpx==0.1.6
+safetensors==0.6.2
+scikit-learn==1.7.2
+scipy==1.15.3
+SecretStorage==3.4.0
+semantic-version==2.10.0
+sentencepiece==0.2.1
+sentry-sdk==2.38.0
+setuptools==78.1.1
+shellingham==1.5.4
+six==1.17.0
+smart_open==7.3.1
+smashed==0.21.5
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.48.0
+sympy==1.13.3
+tensorboard==2.15.2
+tensorboard==2.19.0
+tensorflow==2.15.0
+tensorflow-addons==0.23.0
+tensorflow-datasets==4.9.3
+tensorflow-estimator==2.15.0
+tensorflow-graphics==2021.12.3
+tensorflow-metadata==1.17.2
+threadpoolctl==3.6.0
+timm==1.0.19
+tokenizers==0.22.0
+toml==0.10.2
+tomli==2.2.1
+tomlkit==0.13.3
+torch==2.8.0+rocm6.4
+torchcodec==0.5
+torchmetrics==1.8.2
+torchvision==0.23.0+rocm6.4
+tqdm==4.67.1
+transformers==4.56.1
+trimesh==4.8.2
+trouting==0.3.3
+twine==6.2.0
+typeguard==2.13.3
+typer==0.17.4
+typing_extensions==4.15.0
+typing-inspect==0.9.0
+typing-inspection==0.4.1
+tzdata==2025.2
+urllib3==2.5.0
+uvicorn==0.35.0
+wandb==0.21.4
+wcwidth==0.2.13
+websockets==15.0.1
+wheel==0.45.1
+wrapt==1.14.2
+xxhash==3.5.0
+yarl==1.20.1
+zipp==3.23.0
+lerobot==0.3.4
+minLoRA==0.1.0
+autocommand==2.2.2
+backports.tarfile==1.2.0
+importlib_metadata==8.0.0
+inflect==7.3.1
+jaraco.collections==5.1.0
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+more-itertools==10.3.0
+packaging==24.2
+platformdirs==4.2.2
+tomli==2.0.1
+typeguard==4.3.0
+typing_extensions==4.12.2
+wheel==0.45.1
+zipp==3.19.2
diff --git a/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/files/wandb-metadata.json b/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/files/wandb-metadata.json
new file mode 100644
index 0000000000000000000000000000000000000000..ffed95079d538fa2b99d9d7aafe16660e8477999
--- /dev/null
+++ b/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/files/wandb-metadata.json
@@ -0,0 +1,204 @@
+{
+ "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35",
+ "python": "CPython 3.10.18",
+ "startedAt": "2025-10-02T16:37:29.221472Z",
+ "args": [
+ "qwen2_7b",
+ "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/glue_l1_regression",
+ "--vision_backbone",
+ "openai",
+ "--action_head",
+ "l1_regression",
+ "--seq_len",
+ "1600",
+ "--ft_llm",
+ "--checkpoint",
+ "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924",
+ "--device_train_microbatch_size",
+ "16",
+ "--global_batch_size",
+ "126",
+ "--dataset",
+ "vla_dataset_realworld",
+ "--llm_learning_rate",
+ "5e-5",
+ "--wandb_entity",
+ "henryeap",
+ "--wandb_project",
+ "a1-realworld",
+ "--wandb_run_name",
+ "glue",
+ "--real_world_vla_config_path",
+ "vla_config_realworld/vla_config_glue.yaml",
+ "--save_overwrite"
+ ],
+ "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py",
+ "codePath": "launch_scripts/train_vla.py",
+ "codePathLocal": "launch_scripts/train_vla.py",
+ "git": {
+ "remote": "https://github.com/Spatialtemporal-AI/A1.git",
+ "commit": "5071f59d87c6a976691323cbac66d7a988b0b4e7"
+ },
+ "email": "ihenrykwok@outlook.com",
+ "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/glue_l1_regression/wandb",
+ "host": "auh7-1b-gpu-282",
+ "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "Instinct MI210",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "470343073792",
+ "used": "50535075840"
+ }
+ },
+ "memory": {
+ "total": "2434606956544"
+ },
+ "gpu_amd": [
+ {
+ "id": "2",
+ "uniqueId": "0x492f172b602a22b5",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "3",
+ "uniqueId": "0x1af77dc455975108",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "7",
+ "uniqueId": "0x14a7fc56ac2e5e42",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "0",
+ "uniqueId": "0x2e7a3afcefcaca4b",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "4",
+ "uniqueId": "0xb66ccb62112b0571",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "1",
+ "uniqueId": "0x63f0fe2c43bc1640",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "5",
+ "uniqueId": "0xcec181d5e2ce525",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "6",
+ "uniqueId": "0xdaf531ba129c665e",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ }
+ ],
+ "slurm": {
+ "cluster_name": "ai-04r",
+ "conf": "/etc/slurm/slurm.conf",
+ "cpus_on_node": "128",
+ "gpus_on_node": "8",
+ "gtids": "0",
+ "job_account": "faculty-acc",
+ "job_cpus_per_node": "128",
+ "job_end_time": "1759682204",
+ "job_gid": "2000",
+ "job_gpus": "0,1,2,3,4,5,6,7",
+ "job_id": "2278",
+ "job_name": "mh_glue_l1_regression",
+ "job_nodelist": "auh7-1b-gpu-282",
+ "job_num_nodes": "1",
+ "job_partition": "faculty",
+ "job_qos": "xdqos",
+ "job_start_time": "1759423004",
+ "job_uid": "2013",
+ "job_user": "xiaodan",
+ "jobid": "2278",
+ "localid": "0",
+ "nnodes": "1",
+ "nodeid": "0",
+ "nodelist": "auh7-1b-gpu-282",
+ "nprocs": "1",
+ "ntasks": "1",
+ "ntasks_per_node": "1",
+ "oom_kill_step": "0",
+ "prio_process": "0",
+ "procid": "0",
+ "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts",
+ "submit_host": "auh-1b-cpu-login-001",
+ "task_pid": "3779894",
+ "tasks_per_node": "1",
+ "topology_addr": "auh7-1b-gpu-282",
+ "topology_addr_pattern": "node"
+ },
+ "writerId": "5tngekiy76vcgqn1s8m1wijc9isok5tn"
+}
\ No newline at end of file
diff --git a/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/logs/debug-core.log b/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/logs/debug-core.log
new file mode 100644
index 0000000000000000000000000000000000000000..2bff196e2fe2e6f5c67217603bdc9f341c8b9479
--- /dev/null
+++ b/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/logs/debug-core.log
@@ -0,0 +1,12 @@
+{"time":"2025-10-02T16:37:29.014245666Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpusl77j3_/port-2574789.txt","pid":2574789,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
+{"time":"2025-10-02T16:37:29.016062848Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":2574789}
+{"time":"2025-10-02T16:37:29.016006867Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-2574789-2574955-4107859315/socket","Net":"unix"}}
+{"time":"2025-10-02T16:37:29.198285234Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
+{"time":"2025-10-02T16:37:29.205734663Z","level":"INFO","msg":"handleInformInit: received","streamId":"tmwli25x","id":"1(@)"}
+{"time":"2025-10-02T16:37:30.340260012Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"tmwli25x","id":"1(@)"}
+.txt","pid":3780083,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
+{"time":"2025-10-02T16:37:29.282444644Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":3780083}
+{"time":"2025-10-02T16:37:29.282434424Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-3780083-3780247-3093816148/socket","Net":"unix"}}
+{"time":"2025-10-02T16:37:29.458879988Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
+{"time":"2025-10-02T16:37:29.465619355Z","level":"INFO","msg":"handleInformInit: received","streamId":"7ovz4jzt","id":"1(@)"}
+{"time":"2025-10-02T16:37:30.493288413Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"7ovz4jzt","id":"1(@)"}
diff --git a/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/logs/debug-internal.log b/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/logs/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..f58c1475f78e716f565c85beed1b416156e7b5e0
--- /dev/null
+++ b/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/logs/debug-internal.log
@@ -0,0 +1,6 @@
+{"time":"2025-10-02T16:37:29.467576263Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-10-02T16:37:30.493240032Z","level":"INFO","msg":"stream: created new stream","id":"7ovz4jzt"}
+{"time":"2025-10-02T16:37:30.493282902Z","level":"INFO","msg":"stream: started","id":"7ovz4jzt"}
+{"time":"2025-10-02T16:37:30.493310273Z","level":"INFO","msg":"writer: started","stream_id":"7ovz4jzt"}
+{"time":"2025-10-02T16:37:30.493324013Z","level":"INFO","msg":"sender: started","stream_id":"7ovz4jzt"}
+{"time":"2025-10-02T16:37:30.493358514Z","level":"INFO","msg":"handler: started","stream_id":"7ovz4jzt"}
diff --git a/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/logs/debug.log b/glue_l1_regression/wandb/wandb/run-20251002_163729-7ovz4jzt/logs/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/files/output.log b/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/files/output.log
new file mode 100644
index 0000000000000000000000000000000000000000..791da1475e55cdac5b63d972d946265eafe63e11
--- /dev/null
+++ b/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/files/output.log
@@ -0,0 +1,62529 @@
+wandb: Detected [openai] in use.
+wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
+wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
+10/11 [16:38:47] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Pen', 8, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 8, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 8, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}}
+****** Skip RLDS main; path not found: None
+****** start build LeRobot main...
+build_tokenizer, cache_dir None tokenizer_dir None
+10/11 [16:38:48] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:130
+10/11 [16:38:49] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:438
+****** before LeRobot dataset...
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Pen
+camera_keys: ['image', 'hand_left_image', 'hand_right_image'], state_key: state, action_key: actions
+****** length of the dataset: 17131
+10/11 [16:38:51] INFO | >> build_rlds_train_dataset: Loading train dataset: vla_dataset_realworld/train __init__.py:521
+****** Import RLDSBatchTransform, RLDSDataset successfully.
+****** before RLDS dataset...
+****** data_config.rlds_dataset_name: a1_real_world
+****** data_config.rlds_data_root_dir: /vast/users/xiaodan/zhangjian/datasets/OXE
+214**************
+10/11 [16:38:52] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/fractal20220817_data/0.1.0/dataset_statistics_138513de447c9e5435c5a12cc1c4a3c6a6434524fbd28f4
+ 5463261fac12cf3fb.json.
+214**************
+10/11 [16:38:53] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/jaco_play/0.1.0/dataset_statistics_e081d4716a3da95df91c79d661ae59fa26a43da49db4bf8d716b622b56
+ 3b0ea3.json.
+214**************
+ INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/berkeley_cable_routing/0.1.0/dataset_statistics_08cb4c5b7c5e6c035fc84ea85b2d54c0c46ad608a8763
+ 4ebb18374088d23cd76.json.
+214**************
+ INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/viola/0.1.0/dataset_statistics_2415d8f7de73c8761fedd7c2a9590667fb0d3fdd26664bf4c100222e5cdb89
+ b9.json.
+214**************
+ INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/berkeley_autolab_ur5/0.1.0/dataset_statistics_1b798b015e7b2c4e4396719e3aa4d43a2f400b2edf5dbb0
+ 820cb3df6943d8ddc.json.
+214**************
+10/11 [16:38:54] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/austin_buds_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_ccecde24cc01793b221
+ 4eb0c4c5d7cc0e3ccc623db99bd892b83552b20decfb7.json.
+214**************
+ INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/nyu_franka_play_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_b0d79557eac3059
+ ebf9f679a8f044bd60403f0cba16a37e0df2fe1654416ffe7.json.
+214**************
+10/11 [16:38:55] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/furniture_bench_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_76735bab3752978
+ bef83e1341d3c8db0a0d5a10397247eb3e0459388dccfe698.json.
+214**************
+ INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/austin_sailor_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_4127c515a9413766f
+ e40ac696d884550bc655a40952ef3ae457c404d31570123.json.
+214**************
+10/11 [16:38:56] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/austin_sirius_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_cb2e0273f80029a19
+ dc3dbb3a3a4118a5598e7bff3ff0245891255825b04b42a.json.
+214**************
+ INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/dlr_edan_shared_control_converted_externally_to_rlds/0.1.0/dataset_statistics_b8984563fc3e7ea
+ c0803c667ef58c9deaf2e747683568306ea1d83505d532a76.json.
+214**************
+ INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/utaustin_mutex/0.1.0/dataset_statistics_0a99ee5a8ce4a34ba018a7c0c742a1b74ab7abb7d7a3925f8596a
+ 3fc4eb8efc7.json.
+214**************
+ INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/berkeley_fanuc_manipulation/0.1.0/dataset_statistics_a98d349d0364668095ea3ca38c6785e94f35e5e5
+ 8e234c88fac83775a923b0d0.json.
+214**************
+10/11 [16:38:57] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/bc_z/0.1.0/dataset_statistics_8187209d5cb273687cc8666697219dae50914ae2bee7f03552bd85a91fcfe7a
+ 4.json.
+214**************
+ INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/roboturk/0.1.0/dataset_statistics_3aa821e17a2937f941d4102cfadcb1154853cb45dcec07ccc66893b01f6
+ f1b40.json.
+214**************
+ INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/toto/0.1.0/dataset_statistics_505a51eb76e85fe0969e8e70e45fb8c9ae5d3b1fae2851c7899bea91f74b979
+ 0.json.
+214**************
+ INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/ucsd_kitchen_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_1f1a5f310a2d5a6edc
+ 0e217370e135c8c8598290f11f57025037adcb0d033926.json.
+214**************
+ INFO | >> [*] Loading existing dataset statistics from data_utils.py:200
+ /vast/users/xiaodan/zhangjian/datasets/OXE/iamlab_cmu_pickup_insert_converted_externally_to_rlds/0.1.0/dataset_statistics_698a1f892f8866
+ af9cb4bd5a23611fa44d8c7d9d816f9b3049d2fc3b62442079.json.
+
+######################################################################################
+# Loading the following 18 datasets (incl. sampling weight): #
+# fractal20220817_data: ====================================================0.529250 #
+# jaco_play: ===============================================================0.010898 #
+# berkeley_cable_routing: ==================================================0.005916 #
+# viola: ===================================================================0.021337 #
+# berkeley_autolab_ur5: ====================================================0.027379 #
+# austin_buds_dataset_converted_externally_to_rlds: ========================0.004768 #
+# nyu_franka_play_dataset_converted_externally_to_rlds: ====================0.018817 #
+# furniture_bench_dataset_converted_externally_to_rlds: ====================0.055185 #
+# austin_sailor_dataset_converted_externally_to_rlds: ======================0.049354 #
+# austin_sirius_dataset_converted_externally_to_rlds: ======================0.039129 #
+# dlr_edan_shared_control_converted_externally_to_rlds: ====================0.001248 #
+# utaustin_mutex: ==========================================================0.050583 #
+# berkeley_fanuc_manipulation: =============================================0.017504 #
+# bc_z: ====================================================================0.168166 #
+# roboturk: ================================================================0.000131 #
+# toto: ====================================================================0.000228 #
+# ucsd_kitchen_dataset_converted_externally_to_rlds: =======================0.000006 #
+# iamlab_cmu_pickup_insert_converted_externally_to_rlds: ===================0.000102 #
+######################################################################################
+
+10/11 [16:38:58] INFO | >> [*] Threads per Dataset: [14 1 1 1 1 1 1 2 1 1 1 1 1 5 1 1 1 1] dataset.py:563
+ INFO | >> [*] Reads per Dataset: [14 1 1 1 1 1 1 2 1 1 1 1 1 5 1 1 1 1] dataset.py:564
+ INFO | >> [*] Constructing datasets... dataset.py:567
+214**************
+214**************
+214**************
+214**************
+214**************
+214**************
+214**************
+214**************
+214**************
+214**************
+214**************
+214**************
+214**************
+214**************
+214**************
+214**************
+214**************
+214**************
+10/11 [16:39:02] INFO | >> [*] Applying frame transforms on dataset... dataset.py:607
+****** after RLDSDataset initialization!
+****** length of the dataset: 7154275
+****** Build rlds train dataset: IterableDatasetWrapper successfully.
+****** path: None
+****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None
+****** After build vla train dataset...
+****** iterable_sources: [, ]
+****** Before build mixed iterable dataset...
+****** Build vla train dataloader successfully!
+************************* Build train_dataloader successful!
+************************* Before build_inf_evaluators
+10/11 [16:39:03] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109
+ device id is provided via `init_process_group` or `barrier `. Using the current device set by the user.
+ warnings.warn( # warn only once
+
+************************* Build evaluators successful!
+************************* Early exit flags: early_exit=False
+PROPRIO_DIM 16 does not match ACTION_DIM 16 for AffordVLA
+************************* Initialize model successful!
+***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt
+***** Load checkpoint successful!
+missing keys: ['action_head.state_proj.weight', 'action_head.state_proj.bias', 'action_head.action_in_proj.weight', 'action_head.action_in_proj.bias', 'action_head.action_time_in.weight', 'action_head.action_time_in.bias', 'action_head.action_time_out.weight', 'action_head.action_time_out.bias', 'action_head.memory_proj.weight', 'action_head.memory_proj.bias', 'action_head.gemma.model.layers.0.self_attn.q_proj.weight', 'action_head.gemma.model.layers.0.self_attn.k_proj.weight', 'action_head.gemma.model.layers.0.self_attn.v_proj.weight', 'action_head.gemma.model.layers.0.self_attn.o_proj.weight', 'action_head.gemma.model.layers.0.mlp.gate_proj.weight', 'action_head.gemma.model.layers.0.mlp.up_proj.weight', 'action_head.gemma.model.layers.0.mlp.down_proj.weight', 'action_head.gemma.model.layers.0.input_layernorm.weight', 'action_head.gemma.model.layers.0.post_attention_layernorm.weight', 'action_head.gemma.model.layers.1.self_attn.q_proj.weight', 'action_head.gemma.model.layers.1.self_attn.k_proj.weight', 'action_head.gemma.model.layers.1.self_attn.v_proj.weight', 'action_head.gemma.model.layers.1.self_attn.o_proj.weight', 'action_head.gemma.model.layers.1.mlp.gate_proj.weight', 'action_head.gemma.model.layers.1.mlp.up_proj.weight', 'action_head.gemma.model.layers.1.mlp.down_proj.weight', 'action_head.gemma.model.layers.1.input_layernorm.weight', 'action_head.gemma.model.layers.1.post_attention_layernorm.weight', 'action_head.gemma.model.layers.2.self_attn.q_proj.weight', 'action_head.gemma.model.layers.2.self_attn.k_proj.weight', 'action_head.gemma.model.layers.2.self_attn.v_proj.weight', 'action_head.gemma.model.layers.2.self_attn.o_proj.weight', 'action_head.gemma.model.layers.2.mlp.gate_proj.weight', 'action_head.gemma.model.layers.2.mlp.up_proj.weight', 'action_head.gemma.model.layers.2.mlp.down_proj.weight', 'action_head.gemma.model.layers.2.input_layernorm.weight', 'action_head.gemma.model.layers.2.post_attention_layernorm.weight', 'action_head.gemma.model.layers.3.self_attn.q_proj.weight', 'action_head.gemma.model.layers.3.self_attn.k_proj.weight', 'action_head.gemma.model.layers.3.self_attn.v_proj.weight', 'action_head.gemma.model.layers.3.self_attn.o_proj.weight', 'action_head.gemma.model.layers.3.mlp.gate_proj.weight', 'action_head.gemma.model.layers.3.mlp.up_proj.weight', 'action_head.gemma.model.layers.3.mlp.down_proj.weight', 'action_head.gemma.model.layers.3.input_layernorm.weight', 'action_head.gemma.model.layers.3.post_attention_layernorm.weight', 'action_head.gemma.model.layers.4.self_attn.q_proj.weight', 'action_head.gemma.model.layers.4.self_attn.k_proj.weight', 'action_head.gemma.model.layers.4.self_attn.v_proj.weight', 'action_head.gemma.model.layers.4.self_attn.o_proj.weight', 'action_head.gemma.model.layers.4.mlp.gate_proj.weight', 'action_head.gemma.model.layers.4.mlp.up_proj.weight', 'action_head.gemma.model.layers.4.mlp.down_proj.weight', 'action_head.gemma.model.layers.4.input_layernorm.weight', 'action_head.gemma.model.layers.4.post_attention_layernorm.weight', 'action_head.gemma.model.layers.5.self_attn.q_proj.weight', 'action_head.gemma.model.layers.5.self_attn.k_proj.weight', 'action_head.gemma.model.layers.5.self_attn.v_proj.weight', 'action_head.gemma.model.layers.5.self_attn.o_proj.weight', 'action_head.gemma.model.layers.5.mlp.gate_proj.weight', 'action_head.gemma.model.layers.5.mlp.up_proj.weight', 'action_head.gemma.model.layers.5.mlp.down_proj.weight', 'action_head.gemma.model.layers.5.input_layernorm.weight', 'action_head.gemma.model.layers.5.post_attention_layernorm.weight', 'action_head.gemma.model.layers.6.self_attn.q_proj.weight', 'action_head.gemma.model.layers.6.self_attn.k_proj.weight', 'action_head.gemma.model.layers.6.self_attn.v_proj.weight', 'action_head.gemma.model.layers.6.self_attn.o_proj.weight', 'action_head.gemma.model.layers.6.mlp.gate_proj.weight', 'action_head.gemma.model.layers.6.mlp.up_proj.weight', 'action_head.gemma.model.layers.6.mlp.down_proj.weight', 'action_head.gemma.model.layers.6.input_layernorm.weight', 'action_head.gemma.model.layers.6.post_attention_
+unexpected keys: []
+************************* Initialize model successful!
+************************* Before FSDP model wrapping
+************************* FSDP model wrapping successful!
+************************* Before building optimizer and scheduler
+10/11 [16:40:44] INFO | >> Constructing optimizer with 2 param groups optim.py:1283
+**************************************************
+After building optimizer and scheduler and model, before training, peak GPU memory (MB): 36856
+************************* VLATrainer initialized successfully!
+************************* Before trainer.fit()
+Pre-train system metrics
+ System/Peak GPU Memory (MB)=36,856
+10/11 [16:41:12] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py:967: UserWarning: The .grad attribute warnings.py:109
+ of a Tensor that is not a leaf Tensor is being accessed. Its .grad attribute won't be populated during autograd.backward(). If you indeed
+ want the .grad field to be populated for a non-leaf Tensor, use .retain_grad() on the non-leaf Tensor. If you access the non-leaf Tensor
+ by mistake, make sure you access the leaf Tensor instead. See github.com/pytorch/pytorch/pull/30531 for more informations. (Triggered
+ internally at /pytorch/build/aten/src/ATen/core/TensorBody.h:489.)
+ param_grad = param.grad
+
+[step=1/500000]
+ train/ActionNoiseL2Loss=1.519
+ throughput/total_tokens=192,000
+ System/Peak GPU Memory (MB)=44,240
+[step=2/500000]
+ train/ActionNoiseL2Loss=1.502
+ throughput/total_tokens=384,000
+ throughput/device/tokens_per_second=1,173
+ throughput/device/batches_per_second=0.0489
+ System/Peak GPU Memory (MB)=51,055
+[step=3/500000]
+ train/ActionNoiseL2Loss=1.585
+ throughput/total_tokens=576,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=4/500000]
+ train/ActionNoiseL2Loss=1.586
+ throughput/total_tokens=768,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5/500000]
+ train/ActionNoiseL2Loss=1.485
+ throughput/total_tokens=960,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6/500000]
+ train/ActionNoiseL2Loss=1.494
+ throughput/total_tokens=1,152,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=7/500000]
+ train/ActionNoiseL2Loss=1.422
+ throughput/total_tokens=1,344,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=8/500000]
+ train/ActionNoiseL2Loss=1.405
+ throughput/total_tokens=1,536,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=9/500000]
+ train/ActionNoiseL2Loss=1.447
+ throughput/total_tokens=1,728,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=10/500000]
+ train/ActionNoiseL2Loss=1.275
+ throughput/total_tokens=1,920,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+ System/Peak GPU Memory (MB)=51,072
+[step=11/500000]
+ train/ActionNoiseL2Loss=1.315
+ throughput/total_tokens=2,112,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=12/500000]
+ train/ActionNoiseL2Loss=1.292
+ throughput/total_tokens=2,304,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=13/500000]
+ train/ActionNoiseL2Loss=1.195
+ throughput/total_tokens=2,496,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=14/500000]
+ train/ActionNoiseL2Loss=1.292
+ throughput/total_tokens=2,688,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=15/500000]
+ train/ActionNoiseL2Loss=1.310
+ throughput/total_tokens=2,880,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=16/500000]
+ train/ActionNoiseL2Loss=1.249
+ throughput/total_tokens=3,072,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=17/500000]
+ train/ActionNoiseL2Loss=1.183
+ throughput/total_tokens=3,264,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=18/500000]
+ train/ActionNoiseL2Loss=1.158
+ throughput/total_tokens=3,456,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=19/500000]
+ train/ActionNoiseL2Loss=1.215
+ throughput/total_tokens=3,648,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=20/500000]
+ optim/total_grad_norm=12.39
+ train/ActionNoiseL2Loss=1.170
+ throughput/total_tokens=3,840,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+ System/Peak GPU Memory (MB)=51,073
+[step=21/500000]
+ train/ActionNoiseL2Loss=1.165
+ throughput/total_tokens=4,032,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=22/500000]
+ train/ActionNoiseL2Loss=1.291
+ throughput/total_tokens=4,224,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=23/500000]
+ train/ActionNoiseL2Loss=1.178
+ throughput/total_tokens=4,416,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=24/500000]
+ train/ActionNoiseL2Loss=1.042
+ throughput/total_tokens=4,608,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=25/500000]
+ train/ActionNoiseL2Loss=1.094
+ throughput/total_tokens=4,800,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=26/500000]
+ train/ActionNoiseL2Loss=1.126
+ throughput/total_tokens=4,992,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=27/500000]
+ train/ActionNoiseL2Loss=1.099
+ throughput/total_tokens=5,184,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=28/500000]
+ train/ActionNoiseL2Loss=1.033
+ throughput/total_tokens=5,376,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=29/500000]
+ train/ActionNoiseL2Loss=1.031
+ throughput/total_tokens=5,568,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=30/500000]
+ train/ActionNoiseL2Loss=1.033
+ throughput/total_tokens=5,760,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=31/500000]
+ train/ActionNoiseL2Loss=0.9048
+ throughput/total_tokens=5,952,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=32/500000]
+ train/ActionNoiseL2Loss=0.8875
+ throughput/total_tokens=6,144,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=33/500000]
+ train/ActionNoiseL2Loss=1.080
+ throughput/total_tokens=6,336,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=34/500000]
+ train/ActionNoiseL2Loss=0.9100
+ throughput/total_tokens=6,528,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=35/500000]
+ train/ActionNoiseL2Loss=0.9351
+ throughput/total_tokens=6,720,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=36/500000]
+ train/ActionNoiseL2Loss=0.9959
+ throughput/total_tokens=6,912,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=37/500000]
+ train/ActionNoiseL2Loss=0.8505
+ throughput/total_tokens=7,104,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=38/500000]
+ train/ActionNoiseL2Loss=0.8500
+ throughput/total_tokens=7,296,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=39/500000]
+ train/ActionNoiseL2Loss=0.9952
+ throughput/total_tokens=7,488,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=40/500000]
+ optim/total_grad_norm=9.711
+ train/ActionNoiseL2Loss=0.8173
+ throughput/total_tokens=7,680,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=41/500000]
+ train/ActionNoiseL2Loss=0.7943
+ throughput/total_tokens=7,872,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=42/500000]
+ train/ActionNoiseL2Loss=0.8186
+ throughput/total_tokens=8,064,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=43/500000]
+ train/ActionNoiseL2Loss=0.9047
+ throughput/total_tokens=8,256,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=44/500000]
+ train/ActionNoiseL2Loss=0.9397
+ throughput/total_tokens=8,448,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=45/500000]
+ train/ActionNoiseL2Loss=0.7972
+ throughput/total_tokens=8,640,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=46/500000]
+ train/ActionNoiseL2Loss=0.8425
+ throughput/total_tokens=8,832,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=47/500000]
+ train/ActionNoiseL2Loss=0.8896
+ throughput/total_tokens=9,024,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=48/500000]
+ train/ActionNoiseL2Loss=0.8243
+ throughput/total_tokens=9,216,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=49/500000]
+ train/ActionNoiseL2Loss=0.7242
+ throughput/total_tokens=9,408,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=50/500000]
+ train/ActionNoiseL2Loss=0.7551
+ throughput/total_tokens=9,600,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=51/500000]
+ train/ActionNoiseL2Loss=0.6678
+ throughput/total_tokens=9,792,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=52/500000]
+ train/ActionNoiseL2Loss=0.7104
+ throughput/total_tokens=9,984,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=53/500000]
+ train/ActionNoiseL2Loss=0.7075
+ throughput/total_tokens=10,176,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=54/500000]
+ train/ActionNoiseL2Loss=0.7741
+ throughput/total_tokens=10,368,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=55/500000]
+ train/ActionNoiseL2Loss=0.7664
+ throughput/total_tokens=10,560,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=56/500000]
+ train/ActionNoiseL2Loss=0.8044
+ throughput/total_tokens=10,752,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=57/500000]
+ train/ActionNoiseL2Loss=0.7339
+ throughput/total_tokens=10,944,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=58/500000]
+ train/ActionNoiseL2Loss=0.6304
+ throughput/total_tokens=11,136,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=59/500000]
+ train/ActionNoiseL2Loss=0.6816
+ throughput/total_tokens=11,328,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=60/500000]
+ optim/total_grad_norm=8.873
+ train/ActionNoiseL2Loss=0.6181
+ throughput/total_tokens=11,520,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+ System/Peak GPU Memory (MB)=51,073
+[step=61/500000]
+ train/ActionNoiseL2Loss=0.7512
+ throughput/total_tokens=11,712,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=62/500000]
+ train/ActionNoiseL2Loss=0.6137
+ throughput/total_tokens=11,904,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=63/500000]
+ train/ActionNoiseL2Loss=0.6707
+ throughput/total_tokens=12,096,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=64/500000]
+ train/ActionNoiseL2Loss=0.6804
+ throughput/total_tokens=12,288,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=65/500000]
+ train/ActionNoiseL2Loss=0.7190
+ throughput/total_tokens=12,480,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=66/500000]
+ train/ActionNoiseL2Loss=0.6716
+ throughput/total_tokens=12,672,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=67/500000]
+ train/ActionNoiseL2Loss=0.5929
+ throughput/total_tokens=12,864,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=68/500000]
+ train/ActionNoiseL2Loss=0.6193
+ throughput/total_tokens=13,056,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=69/500000]
+ train/ActionNoiseL2Loss=0.5472
+ throughput/total_tokens=13,248,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=70/500000]
+ train/ActionNoiseL2Loss=0.4597
+ throughput/total_tokens=13,440,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=71/500000]
+ train/ActionNoiseL2Loss=0.6054
+ throughput/total_tokens=13,632,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=72/500000]
+ train/ActionNoiseL2Loss=0.7331
+ throughput/total_tokens=13,824,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=73/500000]
+ train/ActionNoiseL2Loss=0.5427
+ throughput/total_tokens=14,016,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=74/500000]
+ train/ActionNoiseL2Loss=0.5637
+ throughput/total_tokens=14,208,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=75/500000]
+ train/ActionNoiseL2Loss=0.5477
+ throughput/total_tokens=14,400,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=76/500000]
+ train/ActionNoiseL2Loss=0.5682
+ throughput/total_tokens=14,592,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=77/500000]
+ train/ActionNoiseL2Loss=0.4869
+ throughput/total_tokens=14,784,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=78/500000]
+ train/ActionNoiseL2Loss=0.6201
+ throughput/total_tokens=14,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=79/500000]
+ train/ActionNoiseL2Loss=0.5627
+ throughput/total_tokens=15,168,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=80/500000]
+ optim/total_grad_norm=9.329
+ train/ActionNoiseL2Loss=0.5174
+ throughput/total_tokens=15,360,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=81/500000]
+ train/ActionNoiseL2Loss=0.5702
+ throughput/total_tokens=15,552,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=82/500000]
+ train/ActionNoiseL2Loss=0.4655
+ throughput/total_tokens=15,744,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=83/500000]
+ train/ActionNoiseL2Loss=0.5569
+ throughput/total_tokens=15,936,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=84/500000]
+ train/ActionNoiseL2Loss=0.4732
+ throughput/total_tokens=16,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=85/500000]
+ train/ActionNoiseL2Loss=0.6516
+ throughput/total_tokens=16,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=86/500000]
+ train/ActionNoiseL2Loss=0.4406
+ throughput/total_tokens=16,512,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=87/500000]
+ train/ActionNoiseL2Loss=0.4973
+ throughput/total_tokens=16,704,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=88/500000]
+ train/ActionNoiseL2Loss=0.5047
+ throughput/total_tokens=16,896,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=89/500000]
+ train/ActionNoiseL2Loss=0.4724
+ throughput/total_tokens=17,088,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=90/500000]
+ train/ActionNoiseL2Loss=0.4246
+ throughput/total_tokens=17,280,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=91/500000]
+ train/ActionNoiseL2Loss=0.4943
+ throughput/total_tokens=17,472,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=92/500000]
+ train/ActionNoiseL2Loss=0.4381
+ throughput/total_tokens=17,664,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=93/500000]
+ train/ActionNoiseL2Loss=0.3797
+ throughput/total_tokens=17,856,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=94/500000]
+ train/ActionNoiseL2Loss=0.4715
+ throughput/total_tokens=18,048,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=95/500000]
+ train/ActionNoiseL2Loss=0.4033
+ throughput/total_tokens=18,240,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=96/500000]
+ train/ActionNoiseL2Loss=0.3655
+ throughput/total_tokens=18,432,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=97/500000]
+ train/ActionNoiseL2Loss=0.3512
+ throughput/total_tokens=18,624,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=98/500000]
+ train/ActionNoiseL2Loss=0.4246
+ throughput/total_tokens=18,816,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=99/500000]
+ train/ActionNoiseL2Loss=0.3381
+ throughput/total_tokens=19,008,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=100/500000]
+ optim/total_grad_norm=8.408
+ train/ActionNoiseL2Loss=0.4161
+ throughput/total_tokens=19,200,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=101/500000]
+ train/ActionNoiseL2Loss=0.4288
+ throughput/total_tokens=19,392,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=102/500000]
+ train/ActionNoiseL2Loss=0.3854
+ throughput/total_tokens=19,584,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=103/500000]
+ train/ActionNoiseL2Loss=0.3170
+ throughput/total_tokens=19,776,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=104/500000]
+ train/ActionNoiseL2Loss=0.3385
+ throughput/total_tokens=19,968,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=105/500000]
+ train/ActionNoiseL2Loss=0.3698
+ throughput/total_tokens=20,160,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=106/500000]
+ train/ActionNoiseL2Loss=0.3064
+ throughput/total_tokens=20,352,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=107/500000]
+ train/ActionNoiseL2Loss=0.3116
+ throughput/total_tokens=20,544,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=108/500000]
+ train/ActionNoiseL2Loss=0.3547
+ throughput/total_tokens=20,736,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=109/500000]
+ train/ActionNoiseL2Loss=0.3379
+ throughput/total_tokens=20,928,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=110/500000]
+ train/ActionNoiseL2Loss=0.2224
+ throughput/total_tokens=21,120,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+ System/Peak GPU Memory (MB)=51,073
+[step=111/500000]
+ train/ActionNoiseL2Loss=0.2550
+ throughput/total_tokens=21,312,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=112/500000]
+ train/ActionNoiseL2Loss=0.4382
+ throughput/total_tokens=21,504,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=113/500000]
+ train/ActionNoiseL2Loss=0.2271
+ throughput/total_tokens=21,696,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=114/500000]
+ train/ActionNoiseL2Loss=0.4280
+ throughput/total_tokens=21,888,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=115/500000]
+ train/ActionNoiseL2Loss=0.3731
+ throughput/total_tokens=22,080,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=116/500000]
+ train/ActionNoiseL2Loss=0.2528
+ throughput/total_tokens=22,272,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=117/500000]
+ train/ActionNoiseL2Loss=0.2784
+ throughput/total_tokens=22,464,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=118/500000]
+ train/ActionNoiseL2Loss=0.3613
+ throughput/total_tokens=22,656,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=119/500000]
+ train/ActionNoiseL2Loss=0.3111
+ throughput/total_tokens=22,848,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=120/500000]
+ optim/total_grad_norm=11.88
+ train/ActionNoiseL2Loss=0.3579
+ throughput/total_tokens=23,040,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=121/500000]
+ train/ActionNoiseL2Loss=0.2597
+ throughput/total_tokens=23,232,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=122/500000]
+ train/ActionNoiseL2Loss=0.3144
+ throughput/total_tokens=23,424,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=123/500000]
+ train/ActionNoiseL2Loss=0.3832
+ throughput/total_tokens=23,616,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=124/500000]
+ train/ActionNoiseL2Loss=0.3736
+ throughput/total_tokens=23,808,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=125/500000]
+ train/ActionNoiseL2Loss=0.2168
+ throughput/total_tokens=24,000,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=126/500000]
+ train/ActionNoiseL2Loss=0.3654
+ throughput/total_tokens=24,192,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=127/500000]
+ train/ActionNoiseL2Loss=0.2379
+ throughput/total_tokens=24,384,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=128/500000]
+ train/ActionNoiseL2Loss=0.4401
+ throughput/total_tokens=24,576,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=129/500000]
+ train/ActionNoiseL2Loss=0.2832
+ throughput/total_tokens=24,768,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=130/500000]
+ train/ActionNoiseL2Loss=0.2097
+ throughput/total_tokens=24,960,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=131/500000]
+ train/ActionNoiseL2Loss=0.3758
+ throughput/total_tokens=25,152,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=132/500000]
+ train/ActionNoiseL2Loss=0.2539
+ throughput/total_tokens=25,344,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=133/500000]
+ train/ActionNoiseL2Loss=0.3685
+ throughput/total_tokens=25,536,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=134/500000]
+ train/ActionNoiseL2Loss=0.2691
+ throughput/total_tokens=25,728,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=135/500000]
+ train/ActionNoiseL2Loss=0.2767
+ throughput/total_tokens=25,920,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=136/500000]
+ train/ActionNoiseL2Loss=0.3033
+ throughput/total_tokens=26,112,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=137/500000]
+ train/ActionNoiseL2Loss=0.3303
+ throughput/total_tokens=26,304,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=138/500000]
+ train/ActionNoiseL2Loss=0.3087
+ throughput/total_tokens=26,496,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=139/500000]
+ train/ActionNoiseL2Loss=0.2561
+ throughput/total_tokens=26,688,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=140/500000]
+ optim/total_grad_norm=10.48
+ train/ActionNoiseL2Loss=0.3034
+ throughput/total_tokens=26,880,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=141/500000]
+ train/ActionNoiseL2Loss=0.2055
+ throughput/total_tokens=27,072,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=142/500000]
+ train/ActionNoiseL2Loss=0.2397
+ throughput/total_tokens=27,264,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=143/500000]
+ train/ActionNoiseL2Loss=0.2364
+ throughput/total_tokens=27,456,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=144/500000]
+ train/ActionNoiseL2Loss=0.2615
+ throughput/total_tokens=27,648,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=145/500000]
+ train/ActionNoiseL2Loss=0.3684
+ throughput/total_tokens=27,840,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=146/500000]
+ train/ActionNoiseL2Loss=0.3662
+ throughput/total_tokens=28,032,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=147/500000]
+ train/ActionNoiseL2Loss=0.1978
+ throughput/total_tokens=28,224,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=148/500000]
+ train/ActionNoiseL2Loss=0.1766
+ throughput/total_tokens=28,416,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=149/500000]
+ train/ActionNoiseL2Loss=0.2487
+ throughput/total_tokens=28,608,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=150/500000]
+ train/ActionNoiseL2Loss=0.2450
+ throughput/total_tokens=28,800,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=151/500000]
+ train/ActionNoiseL2Loss=0.2397
+ throughput/total_tokens=28,992,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=152/500000]
+ train/ActionNoiseL2Loss=0.3776
+ throughput/total_tokens=29,184,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=153/500000]
+ train/ActionNoiseL2Loss=0.3363
+ throughput/total_tokens=29,376,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=154/500000]
+ train/ActionNoiseL2Loss=0.2345
+ throughput/total_tokens=29,568,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=155/500000]
+ train/ActionNoiseL2Loss=0.3231
+ throughput/total_tokens=29,760,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=156/500000]
+ train/ActionNoiseL2Loss=0.2246
+ throughput/total_tokens=29,952,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=157/500000]
+ train/ActionNoiseL2Loss=0.3735
+ throughput/total_tokens=30,144,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=158/500000]
+ train/ActionNoiseL2Loss=0.2048
+ throughput/total_tokens=30,336,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=159/500000]
+ train/ActionNoiseL2Loss=0.1897
+ throughput/total_tokens=30,528,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=160/500000]
+ optim/total_grad_norm=9.192
+ train/ActionNoiseL2Loss=0.3285
+ throughput/total_tokens=30,720,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+ System/Peak GPU Memory (MB)=51,073
+[step=161/500000]
+ train/ActionNoiseL2Loss=0.3166
+ throughput/total_tokens=30,912,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=162/500000]
+ train/ActionNoiseL2Loss=0.1985
+ throughput/total_tokens=31,104,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=163/500000]
+ train/ActionNoiseL2Loss=0.2286
+ throughput/total_tokens=31,296,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=164/500000]
+ train/ActionNoiseL2Loss=0.2763
+ throughput/total_tokens=31,488,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=165/500000]
+ train/ActionNoiseL2Loss=0.3157
+ throughput/total_tokens=31,680,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=166/500000]
+ train/ActionNoiseL2Loss=0.2681
+ throughput/total_tokens=31,872,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=167/500000]
+ train/ActionNoiseL2Loss=0.2437
+ throughput/total_tokens=32,064,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=168/500000]
+ train/ActionNoiseL2Loss=0.3316
+ throughput/total_tokens=32,256,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=169/500000]
+ train/ActionNoiseL2Loss=0.2685
+ throughput/total_tokens=32,448,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=170/500000]
+ train/ActionNoiseL2Loss=0.2466
+ throughput/total_tokens=32,640,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=171/500000]
+ train/ActionNoiseL2Loss=0.2722
+ throughput/total_tokens=32,832,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=172/500000]
+ train/ActionNoiseL2Loss=0.1813
+ throughput/total_tokens=33,024,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=173/500000]
+ train/ActionNoiseL2Loss=0.2004
+ throughput/total_tokens=33,216,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=174/500000]
+ train/ActionNoiseL2Loss=0.2873
+ throughput/total_tokens=33,408,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=175/500000]
+ train/ActionNoiseL2Loss=0.3610
+ throughput/total_tokens=33,600,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=176/500000]
+ train/ActionNoiseL2Loss=0.2323
+ throughput/total_tokens=33,792,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=177/500000]
+ train/ActionNoiseL2Loss=0.2687
+ throughput/total_tokens=33,984,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=178/500000]
+ train/ActionNoiseL2Loss=0.4066
+ throughput/total_tokens=34,176,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=179/500000]
+ train/ActionNoiseL2Loss=0.2733
+ throughput/total_tokens=34,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=180/500000]
+ optim/total_grad_norm=5.450
+ train/ActionNoiseL2Loss=0.1830
+ throughput/total_tokens=34,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=181/500000]
+ train/ActionNoiseL2Loss=0.2056
+ throughput/total_tokens=34,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=182/500000]
+ train/ActionNoiseL2Loss=0.2547
+ throughput/total_tokens=34,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=183/500000]
+ train/ActionNoiseL2Loss=0.2606
+ throughput/total_tokens=35,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=184/500000]
+ train/ActionNoiseL2Loss=0.3030
+ throughput/total_tokens=35,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=185/500000]
+ train/ActionNoiseL2Loss=0.2967
+ throughput/total_tokens=35,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=186/500000]
+ train/ActionNoiseL2Loss=0.2276
+ throughput/total_tokens=35,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=187/500000]
+ train/ActionNoiseL2Loss=0.1799
+ throughput/total_tokens=35,904,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=188/500000]
+ train/ActionNoiseL2Loss=0.2635
+ throughput/total_tokens=36,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=189/500000]
+ train/ActionNoiseL2Loss=0.3928
+ throughput/total_tokens=36,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=190/500000]
+ train/ActionNoiseL2Loss=0.1769
+ throughput/total_tokens=36,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=191/500000]
+ train/ActionNoiseL2Loss=0.2123
+ throughput/total_tokens=36,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=192/500000]
+ train/ActionNoiseL2Loss=0.1957
+ throughput/total_tokens=36,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=193/500000]
+ train/ActionNoiseL2Loss=0.1835
+ throughput/total_tokens=37,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=194/500000]
+ train/ActionNoiseL2Loss=0.2724
+ throughput/total_tokens=37,248,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=195/500000]
+ train/ActionNoiseL2Loss=0.2827
+ throughput/total_tokens=37,440,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=196/500000]
+ train/ActionNoiseL2Loss=0.1847
+ throughput/total_tokens=37,632,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=197/500000]
+ train/ActionNoiseL2Loss=0.2531
+ throughput/total_tokens=37,824,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=198/500000]
+ train/ActionNoiseL2Loss=0.1785
+ throughput/total_tokens=38,016,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=199/500000]
+ train/ActionNoiseL2Loss=0.1968
+ throughput/total_tokens=38,208,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=200/500000]
+ optim/total_grad_norm=5.479
+ train/ActionNoiseL2Loss=0.1835
+ throughput/total_tokens=38,400,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=201/500000]
+ train/ActionNoiseL2Loss=0.1840
+ throughput/total_tokens=38,592,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=202/500000]
+ train/ActionNoiseL2Loss=0.3384
+ throughput/total_tokens=38,784,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=203/500000]
+ train/ActionNoiseL2Loss=0.2128
+ throughput/total_tokens=38,976,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=204/500000]
+ train/ActionNoiseL2Loss=0.2124
+ throughput/total_tokens=39,168,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=205/500000]
+ train/ActionNoiseL2Loss=0.1583
+ throughput/total_tokens=39,360,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=206/500000]
+ train/ActionNoiseL2Loss=0.1875
+ throughput/total_tokens=39,552,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=207/500000]
+ train/ActionNoiseL2Loss=0.2854
+ throughput/total_tokens=39,744,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=208/500000]
+ train/ActionNoiseL2Loss=0.2597
+ throughput/total_tokens=39,936,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=209/500000]
+ train/ActionNoiseL2Loss=0.2471
+ throughput/total_tokens=40,128,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=210/500000]
+ train/ActionNoiseL2Loss=0.2043
+ throughput/total_tokens=40,320,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=211/500000]
+ train/ActionNoiseL2Loss=0.3694
+ throughput/total_tokens=40,512,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=212/500000]
+ train/ActionNoiseL2Loss=0.2468
+ throughput/total_tokens=40,704,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=213/500000]
+ train/ActionNoiseL2Loss=0.2491
+ throughput/total_tokens=40,896,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=214/500000]
+ train/ActionNoiseL2Loss=0.2010
+ throughput/total_tokens=41,088,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=215/500000]
+ train/ActionNoiseL2Loss=0.2743
+ throughput/total_tokens=41,280,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=216/500000]
+ train/ActionNoiseL2Loss=0.3207
+ throughput/total_tokens=41,472,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=217/500000]
+ train/ActionNoiseL2Loss=0.1929
+ throughput/total_tokens=41,664,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=218/500000]
+ train/ActionNoiseL2Loss=0.2676
+ throughput/total_tokens=41,856,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=219/500000]
+ train/ActionNoiseL2Loss=0.2626
+ throughput/total_tokens=42,048,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=220/500000]
+ optim/total_grad_norm=9.466
+ train/ActionNoiseL2Loss=0.3485
+ throughput/total_tokens=42,240,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=221/500000]
+ train/ActionNoiseL2Loss=0.1883
+ throughput/total_tokens=42,432,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=222/500000]
+ train/ActionNoiseL2Loss=0.2335
+ throughput/total_tokens=42,624,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=223/500000]
+ train/ActionNoiseL2Loss=0.1990
+ throughput/total_tokens=42,816,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=224/500000]
+ train/ActionNoiseL2Loss=0.1495
+ throughput/total_tokens=43,008,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=225/500000]
+ train/ActionNoiseL2Loss=0.2343
+ throughput/total_tokens=43,200,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=226/500000]
+ train/ActionNoiseL2Loss=0.3354
+ throughput/total_tokens=43,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=227/500000]
+ train/ActionNoiseL2Loss=0.2947
+ throughput/total_tokens=43,584,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=228/500000]
+ train/ActionNoiseL2Loss=0.2569
+ throughput/total_tokens=43,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=229/500000]
+ train/ActionNoiseL2Loss=0.3221
+ throughput/total_tokens=43,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=230/500000]
+ train/ActionNoiseL2Loss=0.2014
+ throughput/total_tokens=44,160,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=231/500000]
+ train/ActionNoiseL2Loss=0.3001
+ throughput/total_tokens=44,352,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=232/500000]
+ train/ActionNoiseL2Loss=0.2575
+ throughput/total_tokens=44,544,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=233/500000]
+ train/ActionNoiseL2Loss=0.1880
+ throughput/total_tokens=44,736,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=234/500000]
+ train/ActionNoiseL2Loss=0.2439
+ throughput/total_tokens=44,928,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=235/500000]
+ train/ActionNoiseL2Loss=0.3030
+ throughput/total_tokens=45,120,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=236/500000]
+ train/ActionNoiseL2Loss=0.2480
+ throughput/total_tokens=45,312,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=237/500000]
+ train/ActionNoiseL2Loss=0.2056
+ throughput/total_tokens=45,504,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=238/500000]
+ train/ActionNoiseL2Loss=0.1969
+ throughput/total_tokens=45,696,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=239/500000]
+ train/ActionNoiseL2Loss=0.1694
+ throughput/total_tokens=45,888,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=240/500000]
+ optim/total_grad_norm=10.07
+ train/ActionNoiseL2Loss=0.2776
+ throughput/total_tokens=46,080,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=241/500000]
+ train/ActionNoiseL2Loss=0.2455
+ throughput/total_tokens=46,272,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=242/500000]
+ train/ActionNoiseL2Loss=0.3220
+ throughput/total_tokens=46,464,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=243/500000]
+ train/ActionNoiseL2Loss=0.2572
+ throughput/total_tokens=46,656,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=244/500000]
+ train/ActionNoiseL2Loss=0.2453
+ throughput/total_tokens=46,848,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=245/500000]
+ train/ActionNoiseL2Loss=0.2105
+ throughput/total_tokens=47,040,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=246/500000]
+ train/ActionNoiseL2Loss=0.1987
+ throughput/total_tokens=47,232,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=247/500000]
+ train/ActionNoiseL2Loss=0.2762
+ throughput/total_tokens=47,424,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=248/500000]
+ train/ActionNoiseL2Loss=0.2042
+ throughput/total_tokens=47,616,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=249/500000]
+ train/ActionNoiseL2Loss=0.2733
+ throughput/total_tokens=47,808,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=250/500000]
+ train/ActionNoiseL2Loss=0.1469
+ throughput/total_tokens=48,000,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=251/500000]
+ train/ActionNoiseL2Loss=0.1617
+ throughput/total_tokens=48,192,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=252/500000]
+ train/ActionNoiseL2Loss=0.1515
+ throughput/total_tokens=48,384,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=253/500000]
+ train/ActionNoiseL2Loss=0.2222
+ throughput/total_tokens=48,576,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=254/500000]
+ train/ActionNoiseL2Loss=0.1852
+ throughput/total_tokens=48,768,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=255/500000]
+ train/ActionNoiseL2Loss=0.1409
+ throughput/total_tokens=48,960,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=256/500000]
+ train/ActionNoiseL2Loss=0.2720
+ throughput/total_tokens=49,152,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=257/500000]
+ train/ActionNoiseL2Loss=0.1572
+ throughput/total_tokens=49,344,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=258/500000]
+ train/ActionNoiseL2Loss=0.1860
+ throughput/total_tokens=49,536,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=259/500000]
+ train/ActionNoiseL2Loss=0.2794
+ throughput/total_tokens=49,728,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=260/500000]
+ optim/total_grad_norm=8.083
+ train/ActionNoiseL2Loss=0.3206
+ throughput/total_tokens=49,920,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+ System/Peak GPU Memory (MB)=51,073
+[step=261/500000]
+ train/ActionNoiseL2Loss=0.2065
+ throughput/total_tokens=50,112,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=262/500000]
+ train/ActionNoiseL2Loss=0.2290
+ throughput/total_tokens=50,304,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=263/500000]
+ train/ActionNoiseL2Loss=0.2418
+ throughput/total_tokens=50,496,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=264/500000]
+ train/ActionNoiseL2Loss=0.2465
+ throughput/total_tokens=50,688,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=265/500000]
+ train/ActionNoiseL2Loss=0.3132
+ throughput/total_tokens=50,880,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=266/500000]
+ train/ActionNoiseL2Loss=0.2118
+ throughput/total_tokens=51,072,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=267/500000]
+ train/ActionNoiseL2Loss=0.2233
+ throughput/total_tokens=51,264,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=268/500000]
+ train/ActionNoiseL2Loss=0.2285
+ throughput/total_tokens=51,456,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=269/500000]
+ train/ActionNoiseL2Loss=0.2560
+ throughput/total_tokens=51,648,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=270/500000]
+ train/ActionNoiseL2Loss=0.2125
+ throughput/total_tokens=51,840,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=271/500000]
+ train/ActionNoiseL2Loss=0.2210
+ throughput/total_tokens=52,032,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=272/500000]
+ train/ActionNoiseL2Loss=0.2319
+ throughput/total_tokens=52,224,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=273/500000]
+ train/ActionNoiseL2Loss=0.2696
+ throughput/total_tokens=52,416,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=274/500000]
+ train/ActionNoiseL2Loss=0.2098
+ throughput/total_tokens=52,608,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=275/500000]
+ train/ActionNoiseL2Loss=0.1589
+ throughput/total_tokens=52,800,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=276/500000]
+ train/ActionNoiseL2Loss=0.2310
+ throughput/total_tokens=52,992,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=277/500000]
+ train/ActionNoiseL2Loss=0.2856
+ throughput/total_tokens=53,184,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=278/500000]
+ train/ActionNoiseL2Loss=0.2405
+ throughput/total_tokens=53,376,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=279/500000]
+ train/ActionNoiseL2Loss=0.2688
+ throughput/total_tokens=53,568,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=280/500000]
+ optim/total_grad_norm=11.82
+ train/ActionNoiseL2Loss=0.2380
+ throughput/total_tokens=53,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=281/500000]
+ train/ActionNoiseL2Loss=0.2600
+ throughput/total_tokens=53,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=282/500000]
+ train/ActionNoiseL2Loss=0.3106
+ throughput/total_tokens=54,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=283/500000]
+ train/ActionNoiseL2Loss=0.1720
+ throughput/total_tokens=54,336,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=284/500000]
+ train/ActionNoiseL2Loss=0.2178
+ throughput/total_tokens=54,528,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=285/500000]
+ train/ActionNoiseL2Loss=0.1380
+ throughput/total_tokens=54,720,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=286/500000]
+ train/ActionNoiseL2Loss=0.2496
+ throughput/total_tokens=54,912,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=287/500000]
+ train/ActionNoiseL2Loss=0.2460
+ throughput/total_tokens=55,104,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=288/500000]
+ train/ActionNoiseL2Loss=0.2654
+ throughput/total_tokens=55,296,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=289/500000]
+ train/ActionNoiseL2Loss=0.3097
+ throughput/total_tokens=55,488,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=290/500000]
+ train/ActionNoiseL2Loss=0.2140
+ throughput/total_tokens=55,680,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=291/500000]
+ train/ActionNoiseL2Loss=0.2327
+ throughput/total_tokens=55,872,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=292/500000]
+ train/ActionNoiseL2Loss=0.1976
+ throughput/total_tokens=56,064,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=293/500000]
+ train/ActionNoiseL2Loss=0.2533
+ throughput/total_tokens=56,256,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=294/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=56,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=295/500000]
+ train/ActionNoiseL2Loss=0.1351
+ throughput/total_tokens=56,640,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=296/500000]
+ train/ActionNoiseL2Loss=0.1580
+ throughput/total_tokens=56,832,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=297/500000]
+ train/ActionNoiseL2Loss=0.2327
+ throughput/total_tokens=57,024,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=298/500000]
+ train/ActionNoiseL2Loss=0.2394
+ throughput/total_tokens=57,216,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=299/500000]
+ train/ActionNoiseL2Loss=0.1403
+ throughput/total_tokens=57,408,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=300/500000]
+ optim/total_grad_norm=8.930
+ train/ActionNoiseL2Loss=0.3429
+ throughput/total_tokens=57,600,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=301/500000]
+ train/ActionNoiseL2Loss=0.2080
+ throughput/total_tokens=57,792,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=302/500000]
+ train/ActionNoiseL2Loss=0.1749
+ throughput/total_tokens=57,984,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=303/500000]
+ train/ActionNoiseL2Loss=0.1273
+ throughput/total_tokens=58,176,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=304/500000]
+ train/ActionNoiseL2Loss=0.2321
+ throughput/total_tokens=58,368,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=305/500000]
+ train/ActionNoiseL2Loss=0.2181
+ throughput/total_tokens=58,560,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=306/500000]
+ train/ActionNoiseL2Loss=0.2800
+ throughput/total_tokens=58,752,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=307/500000]
+ train/ActionNoiseL2Loss=0.2758
+ throughput/total_tokens=58,944,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=308/500000]
+ train/ActionNoiseL2Loss=0.2539
+ throughput/total_tokens=59,136,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=309/500000]
+ train/ActionNoiseL2Loss=0.1728
+ throughput/total_tokens=59,328,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=310/500000]
+ train/ActionNoiseL2Loss=0.2298
+ throughput/total_tokens=59,520,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+ System/Peak GPU Memory (MB)=51,073
+[step=311/500000]
+ train/ActionNoiseL2Loss=0.1773
+ throughput/total_tokens=59,712,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=312/500000]
+ train/ActionNoiseL2Loss=0.2068
+ throughput/total_tokens=59,904,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=313/500000]
+ train/ActionNoiseL2Loss=0.2327
+ throughput/total_tokens=60,096,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=314/500000]
+ train/ActionNoiseL2Loss=0.2109
+ throughput/total_tokens=60,288,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=315/500000]
+ train/ActionNoiseL2Loss=0.2001
+ throughput/total_tokens=60,480,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=316/500000]
+ train/ActionNoiseL2Loss=0.1682
+ throughput/total_tokens=60,672,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=317/500000]
+ train/ActionNoiseL2Loss=0.2000
+ throughput/total_tokens=60,864,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=318/500000]
+ train/ActionNoiseL2Loss=0.1912
+ throughput/total_tokens=61,056,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=319/500000]
+ train/ActionNoiseL2Loss=0.2066
+ throughput/total_tokens=61,248,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=320/500000]
+ optim/total_grad_norm=3.601
+ train/ActionNoiseL2Loss=0.1362
+ throughput/total_tokens=61,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=321/500000]
+ train/ActionNoiseL2Loss=0.1727
+ throughput/total_tokens=61,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=322/500000]
+ train/ActionNoiseL2Loss=0.3112
+ throughput/total_tokens=61,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=323/500000]
+ train/ActionNoiseL2Loss=0.2546
+ throughput/total_tokens=62,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=324/500000]
+ train/ActionNoiseL2Loss=0.1605
+ throughput/total_tokens=62,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=325/500000]
+ train/ActionNoiseL2Loss=0.3044
+ throughput/total_tokens=62,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=326/500000]
+ train/ActionNoiseL2Loss=0.1565
+ throughput/total_tokens=62,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=327/500000]
+ train/ActionNoiseL2Loss=0.2338
+ throughput/total_tokens=62,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=328/500000]
+ train/ActionNoiseL2Loss=0.2085
+ throughput/total_tokens=62,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=329/500000]
+ train/ActionNoiseL2Loss=0.1952
+ throughput/total_tokens=63,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=330/500000]
+ train/ActionNoiseL2Loss=0.2354
+ throughput/total_tokens=63,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=331/500000]
+ train/ActionNoiseL2Loss=0.1540
+ throughput/total_tokens=63,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=332/500000]
+ train/ActionNoiseL2Loss=0.1559
+ throughput/total_tokens=63,744,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=333/500000]
+ train/ActionNoiseL2Loss=0.1756
+ throughput/total_tokens=63,936,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=334/500000]
+ train/ActionNoiseL2Loss=0.1632
+ throughput/total_tokens=64,128,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=335/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=64,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=336/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=64,512,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=337/500000]
+ train/ActionNoiseL2Loss=0.2781
+ throughput/total_tokens=64,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=338/500000]
+ train/ActionNoiseL2Loss=0.3489
+ throughput/total_tokens=64,896,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=339/500000]
+ train/ActionNoiseL2Loss=0.2848
+ throughput/total_tokens=65,088,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=340/500000]
+ optim/total_grad_norm=5.420
+ train/ActionNoiseL2Loss=0.1481
+ throughput/total_tokens=65,280,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=341/500000]
+ train/ActionNoiseL2Loss=0.2688
+ throughput/total_tokens=65,472,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=342/500000]
+ train/ActionNoiseL2Loss=0.2809
+ throughput/total_tokens=65,664,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=343/500000]
+ train/ActionNoiseL2Loss=0.2123
+ throughput/total_tokens=65,856,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=344/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=66,048,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=345/500000]
+ train/ActionNoiseL2Loss=0.2867
+ throughput/total_tokens=66,240,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=346/500000]
+ train/ActionNoiseL2Loss=0.1835
+ throughput/total_tokens=66,432,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=347/500000]
+ train/ActionNoiseL2Loss=0.1562
+ throughput/total_tokens=66,624,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=348/500000]
+ train/ActionNoiseL2Loss=0.1792
+ throughput/total_tokens=66,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=349/500000]
+ train/ActionNoiseL2Loss=0.3523
+ throughput/total_tokens=67,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=350/500000]
+ train/ActionNoiseL2Loss=0.1980
+ throughput/total_tokens=67,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=351/500000]
+ train/ActionNoiseL2Loss=0.2031
+ throughput/total_tokens=67,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=352/500000]
+ train/ActionNoiseL2Loss=0.2141
+ throughput/total_tokens=67,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=353/500000]
+ train/ActionNoiseL2Loss=0.2112
+ throughput/total_tokens=67,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=354/500000]
+ train/ActionNoiseL2Loss=0.1769
+ throughput/total_tokens=67,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=355/500000]
+ train/ActionNoiseL2Loss=0.2188
+ throughput/total_tokens=68,160,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=356/500000]
+ train/ActionNoiseL2Loss=0.2647
+ throughput/total_tokens=68,352,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=357/500000]
+ train/ActionNoiseL2Loss=0.2216
+ throughput/total_tokens=68,544,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=358/500000]
+ train/ActionNoiseL2Loss=0.2650
+ throughput/total_tokens=68,736,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=359/500000]
+ train/ActionNoiseL2Loss=0.1240
+ throughput/total_tokens=68,928,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=360/500000]
+ optim/total_grad_norm=4.749
+ train/ActionNoiseL2Loss=0.1916
+ throughput/total_tokens=69,120,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=361/500000]
+ train/ActionNoiseL2Loss=0.1367
+ throughput/total_tokens=69,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=362/500000]
+ train/ActionNoiseL2Loss=0.2858
+ throughput/total_tokens=69,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=363/500000]
+ train/ActionNoiseL2Loss=0.1951
+ throughput/total_tokens=69,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=364/500000]
+ train/ActionNoiseL2Loss=0.2194
+ throughput/total_tokens=69,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=365/500000]
+ train/ActionNoiseL2Loss=0.1941
+ throughput/total_tokens=70,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=366/500000]
+ train/ActionNoiseL2Loss=0.1681
+ throughput/total_tokens=70,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=367/500000]
+ train/ActionNoiseL2Loss=0.2233
+ throughput/total_tokens=70,464,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=368/500000]
+ train/ActionNoiseL2Loss=0.1674
+ throughput/total_tokens=70,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=369/500000]
+ train/ActionNoiseL2Loss=0.1817
+ throughput/total_tokens=70,848,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=370/500000]
+ train/ActionNoiseL2Loss=0.1827
+ throughput/total_tokens=71,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=371/500000]
+ train/ActionNoiseL2Loss=0.1774
+ throughput/total_tokens=71,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=372/500000]
+ train/ActionNoiseL2Loss=0.1426
+ throughput/total_tokens=71,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=373/500000]
+ train/ActionNoiseL2Loss=0.1640
+ throughput/total_tokens=71,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=374/500000]
+ train/ActionNoiseL2Loss=0.2788
+ throughput/total_tokens=71,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=375/500000]
+ train/ActionNoiseL2Loss=0.2013
+ throughput/total_tokens=72,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=376/500000]
+ train/ActionNoiseL2Loss=0.1504
+ throughput/total_tokens=72,192,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=377/500000]
+ train/ActionNoiseL2Loss=0.2573
+ throughput/total_tokens=72,384,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=378/500000]
+ train/ActionNoiseL2Loss=0.1806
+ throughput/total_tokens=72,576,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=379/500000]
+ train/ActionNoiseL2Loss=0.2191
+ throughput/total_tokens=72,768,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=380/500000]
+ optim/total_grad_norm=5.655
+ train/ActionNoiseL2Loss=0.1467
+ throughput/total_tokens=72,960,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=381/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=73,152,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=382/500000]
+ train/ActionNoiseL2Loss=0.1272
+ throughput/total_tokens=73,344,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=383/500000]
+ train/ActionNoiseL2Loss=0.3361
+ throughput/total_tokens=73,536,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=384/500000]
+ train/ActionNoiseL2Loss=0.2426
+ throughput/total_tokens=73,728,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=385/500000]
+ train/ActionNoiseL2Loss=0.1675
+ throughput/total_tokens=73,920,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=386/500000]
+ train/ActionNoiseL2Loss=0.2598
+ throughput/total_tokens=74,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=387/500000]
+ train/ActionNoiseL2Loss=0.1730
+ throughput/total_tokens=74,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=388/500000]
+ train/ActionNoiseL2Loss=0.1520
+ throughput/total_tokens=74,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=389/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=74,688,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=390/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=74,880,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=391/500000]
+ train/ActionNoiseL2Loss=0.2546
+ throughput/total_tokens=75,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=392/500000]
+ train/ActionNoiseL2Loss=0.1723
+ throughput/total_tokens=75,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=393/500000]
+ train/ActionNoiseL2Loss=0.1620
+ throughput/total_tokens=75,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=394/500000]
+ train/ActionNoiseL2Loss=0.1621
+ throughput/total_tokens=75,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=395/500000]
+ train/ActionNoiseL2Loss=0.2363
+ throughput/total_tokens=75,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=396/500000]
+ train/ActionNoiseL2Loss=0.1394
+ throughput/total_tokens=76,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=397/500000]
+ train/ActionNoiseL2Loss=0.2378
+ throughput/total_tokens=76,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=398/500000]
+ train/ActionNoiseL2Loss=0.1829
+ throughput/total_tokens=76,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=399/500000]
+ train/ActionNoiseL2Loss=0.1711
+ throughput/total_tokens=76,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=400/500000]
+ optim/total_grad_norm=5.119
+ train/ActionNoiseL2Loss=0.2104
+ throughput/total_tokens=76,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=401/500000]
+ train/ActionNoiseL2Loss=0.1339
+ throughput/total_tokens=76,992,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=402/500000]
+ train/ActionNoiseL2Loss=0.1086
+ throughput/total_tokens=77,184,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=403/500000]
+ train/ActionNoiseL2Loss=0.1307
+ throughput/total_tokens=77,376,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=404/500000]
+ train/ActionNoiseL2Loss=0.1874
+ throughput/total_tokens=77,568,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=405/500000]
+ train/ActionNoiseL2Loss=0.1242
+ throughput/total_tokens=77,760,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=406/500000]
+ train/ActionNoiseL2Loss=0.1261
+ throughput/total_tokens=77,952,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=407/500000]
+ train/ActionNoiseL2Loss=0.1617
+ throughput/total_tokens=78,144,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=408/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=78,336,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=409/500000]
+ train/ActionNoiseL2Loss=0.1600
+ throughput/total_tokens=78,528,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=410/500000]
+ train/ActionNoiseL2Loss=0.2449
+ throughput/total_tokens=78,720,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=411/500000]
+ train/ActionNoiseL2Loss=0.1917
+ throughput/total_tokens=78,912,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=412/500000]
+ train/ActionNoiseL2Loss=0.2427
+ throughput/total_tokens=79,104,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=413/500000]
+ train/ActionNoiseL2Loss=0.2062
+ throughput/total_tokens=79,296,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=414/500000]
+ train/ActionNoiseL2Loss=0.2036
+ throughput/total_tokens=79,488,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=415/500000]
+ train/ActionNoiseL2Loss=0.1851
+ throughput/total_tokens=79,680,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=416/500000]
+ train/ActionNoiseL2Loss=0.2119
+ throughput/total_tokens=79,872,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=417/500000]
+ train/ActionNoiseL2Loss=0.1340
+ throughput/total_tokens=80,064,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=418/500000]
+ train/ActionNoiseL2Loss=0.1511
+ throughput/total_tokens=80,256,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=419/500000]
+ train/ActionNoiseL2Loss=0.2105
+ throughput/total_tokens=80,448,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=420/500000]
+ optim/total_grad_norm=7.806
+ train/ActionNoiseL2Loss=0.2744
+ throughput/total_tokens=80,640,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=421/500000]
+ train/ActionNoiseL2Loss=0.2487
+ throughput/total_tokens=80,832,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=422/500000]
+ train/ActionNoiseL2Loss=0.1745
+ throughput/total_tokens=81,024,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=423/500000]
+ train/ActionNoiseL2Loss=0.1720
+ throughput/total_tokens=81,216,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=424/500000]
+ train/ActionNoiseL2Loss=0.1305
+ throughput/total_tokens=81,408,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=425/500000]
+ train/ActionNoiseL2Loss=0.2078
+ throughput/total_tokens=81,600,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=426/500000]
+ train/ActionNoiseL2Loss=0.1464
+ throughput/total_tokens=81,792,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=427/500000]
+ train/ActionNoiseL2Loss=0.2094
+ throughput/total_tokens=81,984,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=428/500000]
+ train/ActionNoiseL2Loss=0.1700
+ throughput/total_tokens=82,176,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=429/500000]
+ train/ActionNoiseL2Loss=0.2207
+ throughput/total_tokens=82,368,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=430/500000]
+ train/ActionNoiseL2Loss=0.1370
+ throughput/total_tokens=82,560,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=431/500000]
+ train/ActionNoiseL2Loss=0.1620
+ throughput/total_tokens=82,752,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=432/500000]
+ train/ActionNoiseL2Loss=0.1340
+ throughput/total_tokens=82,944,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=433/500000]
+ train/ActionNoiseL2Loss=0.1681
+ throughput/total_tokens=83,136,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=434/500000]
+ train/ActionNoiseL2Loss=0.1464
+ throughput/total_tokens=83,328,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=435/500000]
+ train/ActionNoiseL2Loss=0.1513
+ throughput/total_tokens=83,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=436/500000]
+ train/ActionNoiseL2Loss=0.1515
+ throughput/total_tokens=83,712,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=437/500000]
+ train/ActionNoiseL2Loss=0.1913
+ throughput/total_tokens=83,904,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=438/500000]
+ train/ActionNoiseL2Loss=0.2011
+ throughput/total_tokens=84,096,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=439/500000]
+ train/ActionNoiseL2Loss=0.1699
+ throughput/total_tokens=84,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=440/500000]
+ optim/total_grad_norm=5.096
+ train/ActionNoiseL2Loss=0.1520
+ throughput/total_tokens=84,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=441/500000]
+ train/ActionNoiseL2Loss=0.1895
+ throughput/total_tokens=84,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=442/500000]
+ train/ActionNoiseL2Loss=0.1972
+ throughput/total_tokens=84,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=443/500000]
+ train/ActionNoiseL2Loss=0.2155
+ throughput/total_tokens=85,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=444/500000]
+ train/ActionNoiseL2Loss=0.1870
+ throughput/total_tokens=85,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=445/500000]
+ train/ActionNoiseL2Loss=0.2414
+ throughput/total_tokens=85,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=446/500000]
+ train/ActionNoiseL2Loss=0.1319
+ throughput/total_tokens=85,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=447/500000]
+ train/ActionNoiseL2Loss=0.2131
+ throughput/total_tokens=85,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=448/500000]
+ train/ActionNoiseL2Loss=0.1907
+ throughput/total_tokens=86,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=449/500000]
+ train/ActionNoiseL2Loss=0.2146
+ throughput/total_tokens=86,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=450/500000]
+ train/ActionNoiseL2Loss=0.1932
+ throughput/total_tokens=86,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=451/500000]
+ train/ActionNoiseL2Loss=0.2243
+ throughput/total_tokens=86,592,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=452/500000]
+ train/ActionNoiseL2Loss=0.1904
+ throughput/total_tokens=86,784,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=453/500000]
+ train/ActionNoiseL2Loss=0.3030
+ throughput/total_tokens=86,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=454/500000]
+ train/ActionNoiseL2Loss=0.1899
+ throughput/total_tokens=87,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=455/500000]
+ train/ActionNoiseL2Loss=0.2953
+ throughput/total_tokens=87,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=456/500000]
+ train/ActionNoiseL2Loss=0.2969
+ throughput/total_tokens=87,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=457/500000]
+ train/ActionNoiseL2Loss=0.2131
+ throughput/total_tokens=87,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=458/500000]
+ train/ActionNoiseL2Loss=0.2375
+ throughput/total_tokens=87,936,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=459/500000]
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=88,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=460/500000]
+ optim/total_grad_norm=6.416
+ train/ActionNoiseL2Loss=0.1888
+ throughput/total_tokens=88,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=461/500000]
+ train/ActionNoiseL2Loss=0.2208
+ throughput/total_tokens=88,512,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=462/500000]
+ train/ActionNoiseL2Loss=0.2369
+ throughput/total_tokens=88,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=463/500000]
+ train/ActionNoiseL2Loss=0.1935
+ throughput/total_tokens=88,896,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=464/500000]
+ train/ActionNoiseL2Loss=0.2068
+ throughput/total_tokens=89,088,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=465/500000]
+ train/ActionNoiseL2Loss=0.1551
+ throughput/total_tokens=89,280,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=466/500000]
+ train/ActionNoiseL2Loss=0.1616
+ throughput/total_tokens=89,472,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=467/500000]
+ train/ActionNoiseL2Loss=0.1527
+ throughput/total_tokens=89,664,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=468/500000]
+ train/ActionNoiseL2Loss=0.2638
+ throughput/total_tokens=89,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=469/500000]
+ train/ActionNoiseL2Loss=0.1584
+ throughput/total_tokens=90,048,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=470/500000]
+ train/ActionNoiseL2Loss=0.2211
+ throughput/total_tokens=90,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=471/500000]
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=90,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=472/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=90,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=473/500000]
+ train/ActionNoiseL2Loss=0.2066
+ throughput/total_tokens=90,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=474/500000]
+ train/ActionNoiseL2Loss=0.1657
+ throughput/total_tokens=91,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=475/500000]
+ train/ActionNoiseL2Loss=0.1244
+ throughput/total_tokens=91,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=476/500000]
+ train/ActionNoiseL2Loss=0.1742
+ throughput/total_tokens=91,392,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=477/500000]
+ train/ActionNoiseL2Loss=0.2302
+ throughput/total_tokens=91,584,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=478/500000]
+ train/ActionNoiseL2Loss=0.1482
+ throughput/total_tokens=91,776,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=479/500000]
+ train/ActionNoiseL2Loss=0.2227
+ throughput/total_tokens=91,968,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=480/500000]
+ optim/total_grad_norm=6.586
+ train/ActionNoiseL2Loss=0.2067
+ throughput/total_tokens=92,160,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=481/500000]
+ train/ActionNoiseL2Loss=0.2317
+ throughput/total_tokens=92,352,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=482/500000]
+ train/ActionNoiseL2Loss=0.1305
+ throughput/total_tokens=92,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=483/500000]
+ train/ActionNoiseL2Loss=0.2117
+ throughput/total_tokens=92,736,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=484/500000]
+ train/ActionNoiseL2Loss=0.1437
+ throughput/total_tokens=92,928,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=485/500000]
+ train/ActionNoiseL2Loss=0.2090
+ throughput/total_tokens=93,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=486/500000]
+ train/ActionNoiseL2Loss=0.1320
+ throughput/total_tokens=93,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=487/500000]
+ train/ActionNoiseL2Loss=0.1798
+ throughput/total_tokens=93,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=488/500000]
+ train/ActionNoiseL2Loss=0.1369
+ throughput/total_tokens=93,696,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=489/500000]
+ train/ActionNoiseL2Loss=0.1915
+ throughput/total_tokens=93,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=490/500000]
+ train/ActionNoiseL2Loss=0.1589
+ throughput/total_tokens=94,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=491/500000]
+ train/ActionNoiseL2Loss=0.1571
+ throughput/total_tokens=94,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=492/500000]
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=94,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=493/500000]
+ train/ActionNoiseL2Loss=0.1407
+ throughput/total_tokens=94,656,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=494/500000]
+ train/ActionNoiseL2Loss=0.1679
+ throughput/total_tokens=94,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=495/500000]
+ train/ActionNoiseL2Loss=0.1828
+ throughput/total_tokens=95,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=496/500000]
+ train/ActionNoiseL2Loss=0.2612
+ throughput/total_tokens=95,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=497/500000]
+ train/ActionNoiseL2Loss=0.1588
+ throughput/total_tokens=95,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=498/500000]
+ train/ActionNoiseL2Loss=0.2024
+ throughput/total_tokens=95,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=499/500000]
+ train/ActionNoiseL2Loss=0.1385
+ throughput/total_tokens=95,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=500/500000]
+ optim/total_grad_norm=4.314
+ train/ActionNoiseL2Loss=0.1216
+ throughput/total_tokens=96,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+10/11 [19:35:29] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/fully_sharded_data_parallel.py:678: warnings.py:109
+ FutureWarning: FSDP.state_dict_type() and FSDP.set_state_dict_type() are being deprecated. Please use APIs, get_state_dict() and
+ set_state_dict(), which can support different parallelisms, FSDP1, FSDP2, DDP. API doc:
+ https://pytorch.org/docs/stable/distributed.checkpoint.html#torch.distributed.checkpoint.state_dict.get_state_dict .Tutorial:
+ https://pytorch.org/tutorials/recipes/distributed_checkpoint_recipe.html .
+ warnings.warn(
+
+ WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:860: UserWarning: warnings.py:109
+ `_get_pg_default_device` will be deprecated, it only stays for backward-compatiblity reason. If you need to find a device for object
+ collectives, please use `_get_object_coll_device`. If you need to query the device types supported by group, please use
+ `_device_capability(group)`.
+ warnings.warn(
+
+10/11 [19:35:32] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:722: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ local_shape = tensor.shape
+
+ WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:739: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ tensor.shape,
+
+ WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:741: FutureWarning: warnings.py:109
+ Please use DTensor instead and we are deprecating ShardedTensor.
+ tensor.dtype,
+
+10/11 [19:35:36] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/overrides.py:1747: FutureWarning: Please use DTensor warnings.py:109
+ instead and we are deprecating ShardedTensor.
+ result = torch_func_method(public_api, types, args, kwargs)
+
+10/11 [19:35:56] INFO | >> Saving config... checkpoint.py:608
+10/11 [19:36:41] INFO | >> Saving model state... checkpoint.py:796
+10/11 [19:37:53] INFO | >> Saving optim state... checkpoint.py:811
+10/11 [19:39:26] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=501/500000]
+ train/ActionNoiseL2Loss=0.1745
+ throughput/total_tokens=96,192,000
+ throughput/device/tokens_per_second=1,121
+ throughput/device/batches_per_second=0.0467
+[step=502/500000]
+ train/ActionNoiseL2Loss=0.1810
+ throughput/total_tokens=96,384,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=503/500000]
+ train/ActionNoiseL2Loss=0.2385
+ throughput/total_tokens=96,576,000
+ throughput/device/tokens_per_second=1,113
+ throughput/device/batches_per_second=0.0464
+[step=504/500000]
+ train/ActionNoiseL2Loss=0.3315
+ throughput/total_tokens=96,768,000
+ throughput/device/tokens_per_second=1,117
+ throughput/device/batches_per_second=0.0466
+[step=505/500000]
+ train/ActionNoiseL2Loss=0.1971
+ throughput/total_tokens=96,960,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0469
+[step=506/500000]
+ train/ActionNoiseL2Loss=0.2301
+ throughput/total_tokens=97,152,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=507/500000]
+ train/ActionNoiseL2Loss=0.1581
+ throughput/total_tokens=97,344,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=508/500000]
+ train/ActionNoiseL2Loss=0.1689
+ throughput/total_tokens=97,536,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=509/500000]
+ train/ActionNoiseL2Loss=0.2296
+ throughput/total_tokens=97,728,000
+ throughput/device/tokens_per_second=1,135
+ throughput/device/batches_per_second=0.0473
+[step=510/500000]
+ train/ActionNoiseL2Loss=0.2228
+ throughput/total_tokens=97,920,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+ System/Peak GPU Memory (MB)=51,073
+[step=511/500000]
+ train/ActionNoiseL2Loss=0.2334
+ throughput/total_tokens=98,112,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=512/500000]
+ train/ActionNoiseL2Loss=0.2247
+ throughput/total_tokens=98,304,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=513/500000]
+ train/ActionNoiseL2Loss=0.1961
+ throughput/total_tokens=98,496,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=514/500000]
+ train/ActionNoiseL2Loss=0.1523
+ throughput/total_tokens=98,688,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=515/500000]
+ train/ActionNoiseL2Loss=0.2118
+ throughput/total_tokens=98,880,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=516/500000]
+ train/ActionNoiseL2Loss=0.1710
+ throughput/total_tokens=99,072,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=517/500000]
+ train/ActionNoiseL2Loss=0.1248
+ throughput/total_tokens=99,264,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=518/500000]
+ train/ActionNoiseL2Loss=0.1520
+ throughput/total_tokens=99,456,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=519/500000]
+ train/ActionNoiseL2Loss=0.3211
+ throughput/total_tokens=99,648,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=520/500000]
+ optim/total_grad_norm=5.406
+ train/ActionNoiseL2Loss=0.1276
+ throughput/total_tokens=99,840,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+ System/Peak GPU Memory (MB)=51,073
+[step=521/500000]
+ train/ActionNoiseL2Loss=0.1698
+ throughput/total_tokens=100,032,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=522/500000]
+ train/ActionNoiseL2Loss=0.1423
+ throughput/total_tokens=100,224,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=523/500000]
+ train/ActionNoiseL2Loss=0.1752
+ throughput/total_tokens=100,416,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=524/500000]
+ train/ActionNoiseL2Loss=0.2718
+ throughput/total_tokens=100,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=525/500000]
+ train/ActionNoiseL2Loss=0.2544
+ throughput/total_tokens=100,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=526/500000]
+ train/ActionNoiseL2Loss=0.1704
+ throughput/total_tokens=100,992,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=527/500000]
+ train/ActionNoiseL2Loss=0.2062
+ throughput/total_tokens=101,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=528/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=101,376,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=529/500000]
+ train/ActionNoiseL2Loss=0.1725
+ throughput/total_tokens=101,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=530/500000]
+ train/ActionNoiseL2Loss=0.3264
+ throughput/total_tokens=101,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=531/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=101,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=532/500000]
+ train/ActionNoiseL2Loss=0.2097
+ throughput/total_tokens=102,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=533/500000]
+ train/ActionNoiseL2Loss=0.3398
+ throughput/total_tokens=102,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=534/500000]
+ train/ActionNoiseL2Loss=0.2442
+ throughput/total_tokens=102,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=535/500000]
+ train/ActionNoiseL2Loss=0.2424
+ throughput/total_tokens=102,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=536/500000]
+ train/ActionNoiseL2Loss=0.2164
+ throughput/total_tokens=102,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=537/500000]
+ train/ActionNoiseL2Loss=0.3170
+ throughput/total_tokens=103,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=538/500000]
+ train/ActionNoiseL2Loss=0.2741
+ throughput/total_tokens=103,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=539/500000]
+ train/ActionNoiseL2Loss=0.1413
+ throughput/total_tokens=103,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=540/500000]
+ optim/total_grad_norm=3.343
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=103,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=541/500000]
+ train/ActionNoiseL2Loss=0.1170
+ throughput/total_tokens=103,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=542/500000]
+ train/ActionNoiseL2Loss=0.1386
+ throughput/total_tokens=104,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=543/500000]
+ train/ActionNoiseL2Loss=0.1281
+ throughput/total_tokens=104,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=544/500000]
+ train/ActionNoiseL2Loss=0.1548
+ throughput/total_tokens=104,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=545/500000]
+ train/ActionNoiseL2Loss=0.1644
+ throughput/total_tokens=104,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=546/500000]
+ train/ActionNoiseL2Loss=0.1364
+ throughput/total_tokens=104,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=547/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=105,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=548/500000]
+ train/ActionNoiseL2Loss=0.1200
+ throughput/total_tokens=105,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=549/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=105,408,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=550/500000]
+ train/ActionNoiseL2Loss=0.2140
+ throughput/total_tokens=105,600,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=551/500000]
+ train/ActionNoiseL2Loss=0.1315
+ throughput/total_tokens=105,792,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=552/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=105,984,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=553/500000]
+ train/ActionNoiseL2Loss=0.1183
+ throughput/total_tokens=106,176,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=554/500000]
+ train/ActionNoiseL2Loss=0.1991
+ throughput/total_tokens=106,368,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=555/500000]
+ train/ActionNoiseL2Loss=0.2138
+ throughput/total_tokens=106,560,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=556/500000]
+ train/ActionNoiseL2Loss=0.1149
+ throughput/total_tokens=106,752,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=557/500000]
+ train/ActionNoiseL2Loss=0.2048
+ throughput/total_tokens=106,944,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=558/500000]
+ train/ActionNoiseL2Loss=0.2016
+ throughput/total_tokens=107,136,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=559/500000]
+ train/ActionNoiseL2Loss=0.2360
+ throughput/total_tokens=107,328,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=560/500000]
+ optim/total_grad_norm=4.131
+ train/ActionNoiseL2Loss=0.1146
+ throughput/total_tokens=107,520,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=561/500000]
+ train/ActionNoiseL2Loss=0.2263
+ throughput/total_tokens=107,712,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=562/500000]
+ train/ActionNoiseL2Loss=0.1401
+ throughput/total_tokens=107,904,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=563/500000]
+ train/ActionNoiseL2Loss=0.1911
+ throughput/total_tokens=108,096,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=564/500000]
+ train/ActionNoiseL2Loss=0.1462
+ throughput/total_tokens=108,288,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=565/500000]
+ train/ActionNoiseL2Loss=0.1749
+ throughput/total_tokens=108,480,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=566/500000]
+ train/ActionNoiseL2Loss=0.1104
+ throughput/total_tokens=108,672,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=567/500000]
+ train/ActionNoiseL2Loss=0.1496
+ throughput/total_tokens=108,864,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=568/500000]
+ train/ActionNoiseL2Loss=0.2938
+ throughput/total_tokens=109,056,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=569/500000]
+ train/ActionNoiseL2Loss=0.1602
+ throughput/total_tokens=109,248,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=570/500000]
+ train/ActionNoiseL2Loss=0.1788
+ throughput/total_tokens=109,440,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=571/500000]
+ train/ActionNoiseL2Loss=0.2028
+ throughput/total_tokens=109,632,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=572/500000]
+ train/ActionNoiseL2Loss=0.1374
+ throughput/total_tokens=109,824,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=573/500000]
+ train/ActionNoiseL2Loss=0.1629
+ throughput/total_tokens=110,016,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=574/500000]
+ train/ActionNoiseL2Loss=0.1203
+ throughput/total_tokens=110,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=575/500000]
+ train/ActionNoiseL2Loss=0.2033
+ throughput/total_tokens=110,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=576/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=110,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=577/500000]
+ train/ActionNoiseL2Loss=0.1355
+ throughput/total_tokens=110,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=578/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=110,976,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=579/500000]
+ train/ActionNoiseL2Loss=0.1890
+ throughput/total_tokens=111,168,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=580/500000]
+ optim/total_grad_norm=9.256
+ train/ActionNoiseL2Loss=0.2974
+ throughput/total_tokens=111,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=581/500000]
+ train/ActionNoiseL2Loss=0.3300
+ throughput/total_tokens=111,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=582/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=111,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=583/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=111,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=584/500000]
+ train/ActionNoiseL2Loss=0.1906
+ throughput/total_tokens=112,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=585/500000]
+ train/ActionNoiseL2Loss=0.1586
+ throughput/total_tokens=112,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=586/500000]
+ train/ActionNoiseL2Loss=0.2077
+ throughput/total_tokens=112,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=587/500000]
+ train/ActionNoiseL2Loss=0.1705
+ throughput/total_tokens=112,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=588/500000]
+ train/ActionNoiseL2Loss=0.2178
+ throughput/total_tokens=112,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=589/500000]
+ train/ActionNoiseL2Loss=0.3012
+ throughput/total_tokens=113,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=590/500000]
+ train/ActionNoiseL2Loss=0.2861
+ throughput/total_tokens=113,280,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=591/500000]
+ train/ActionNoiseL2Loss=0.1595
+ throughput/total_tokens=113,472,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=592/500000]
+ train/ActionNoiseL2Loss=0.1789
+ throughput/total_tokens=113,664,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=593/500000]
+ train/ActionNoiseL2Loss=0.1966
+ throughput/total_tokens=113,856,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=594/500000]
+ train/ActionNoiseL2Loss=0.2309
+ throughput/total_tokens=114,048,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=595/500000]
+ train/ActionNoiseL2Loss=0.2328
+ throughput/total_tokens=114,240,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=596/500000]
+ train/ActionNoiseL2Loss=0.1325
+ throughput/total_tokens=114,432,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=597/500000]
+ train/ActionNoiseL2Loss=0.2496
+ throughput/total_tokens=114,624,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=598/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=114,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=599/500000]
+ train/ActionNoiseL2Loss=0.2206
+ throughput/total_tokens=115,008,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=600/500000]
+ optim/total_grad_norm=4.675
+ train/ActionNoiseL2Loss=0.1530
+ throughput/total_tokens=115,200,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=601/500000]
+ train/ActionNoiseL2Loss=0.2215
+ throughput/total_tokens=115,392,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=602/500000]
+ train/ActionNoiseL2Loss=0.1775
+ throughput/total_tokens=115,584,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=603/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=115,776,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=604/500000]
+ train/ActionNoiseL2Loss=0.1786
+ throughput/total_tokens=115,968,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=605/500000]
+ train/ActionNoiseL2Loss=0.1537
+ throughput/total_tokens=116,160,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=606/500000]
+ train/ActionNoiseL2Loss=0.1261
+ throughput/total_tokens=116,352,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=607/500000]
+ train/ActionNoiseL2Loss=0.1690
+ throughput/total_tokens=116,544,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=608/500000]
+ train/ActionNoiseL2Loss=0.1497
+ throughput/total_tokens=116,736,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=609/500000]
+ train/ActionNoiseL2Loss=0.2069
+ throughput/total_tokens=116,928,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=610/500000]
+ train/ActionNoiseL2Loss=0.1361
+ throughput/total_tokens=117,120,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+ System/Peak GPU Memory (MB)=51,073
+[step=611/500000]
+ train/ActionNoiseL2Loss=0.1400
+ throughput/total_tokens=117,312,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=612/500000]
+ train/ActionNoiseL2Loss=0.2201
+ throughput/total_tokens=117,504,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=613/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=117,696,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=614/500000]
+ train/ActionNoiseL2Loss=0.1281
+ throughput/total_tokens=117,888,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=615/500000]
+ train/ActionNoiseL2Loss=0.1372
+ throughput/total_tokens=118,080,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=616/500000]
+ train/ActionNoiseL2Loss=0.2042
+ throughput/total_tokens=118,272,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=617/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=118,464,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=618/500000]
+ train/ActionNoiseL2Loss=0.1948
+ throughput/total_tokens=118,656,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=619/500000]
+ train/ActionNoiseL2Loss=0.2450
+ throughput/total_tokens=118,848,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=620/500000]
+ optim/total_grad_norm=3.634
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=119,040,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=621/500000]
+ train/ActionNoiseL2Loss=0.1565
+ throughput/total_tokens=119,232,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=622/500000]
+ train/ActionNoiseL2Loss=0.2183
+ throughput/total_tokens=119,424,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=623/500000]
+ train/ActionNoiseL2Loss=0.2071
+ throughput/total_tokens=119,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=624/500000]
+ train/ActionNoiseL2Loss=0.1697
+ throughput/total_tokens=119,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=625/500000]
+ train/ActionNoiseL2Loss=0.1987
+ throughput/total_tokens=120,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=626/500000]
+ train/ActionNoiseL2Loss=0.1217
+ throughput/total_tokens=120,192,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=627/500000]
+ train/ActionNoiseL2Loss=0.1358
+ throughput/total_tokens=120,384,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=628/500000]
+ train/ActionNoiseL2Loss=0.2497
+ throughput/total_tokens=120,576,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=629/500000]
+ train/ActionNoiseL2Loss=0.2539
+ throughput/total_tokens=120,768,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=630/500000]
+ train/ActionNoiseL2Loss=0.2286
+ throughput/total_tokens=120,960,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=631/500000]
+ train/ActionNoiseL2Loss=0.1353
+ throughput/total_tokens=121,152,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=632/500000]
+ train/ActionNoiseL2Loss=0.2696
+ throughput/total_tokens=121,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=633/500000]
+ train/ActionNoiseL2Loss=0.1484
+ throughput/total_tokens=121,536,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=634/500000]
+ train/ActionNoiseL2Loss=0.1830
+ throughput/total_tokens=121,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=635/500000]
+ train/ActionNoiseL2Loss=0.1570
+ throughput/total_tokens=121,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=636/500000]
+ train/ActionNoiseL2Loss=0.2698
+ throughput/total_tokens=122,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=637/500000]
+ train/ActionNoiseL2Loss=0.1176
+ throughput/total_tokens=122,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=638/500000]
+ train/ActionNoiseL2Loss=0.2378
+ throughput/total_tokens=122,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=639/500000]
+ train/ActionNoiseL2Loss=0.1473
+ throughput/total_tokens=122,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=640/500000]
+ optim/total_grad_norm=2.739
+ train/ActionNoiseL2Loss=0.1202
+ throughput/total_tokens=122,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=641/500000]
+ train/ActionNoiseL2Loss=0.1993
+ throughput/total_tokens=123,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=642/500000]
+ train/ActionNoiseL2Loss=0.1925
+ throughput/total_tokens=123,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=643/500000]
+ train/ActionNoiseL2Loss=0.1329
+ throughput/total_tokens=123,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=644/500000]
+ train/ActionNoiseL2Loss=0.1884
+ throughput/total_tokens=123,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=645/500000]
+ train/ActionNoiseL2Loss=0.1757
+ throughput/total_tokens=123,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=646/500000]
+ train/ActionNoiseL2Loss=0.1760
+ throughput/total_tokens=124,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=647/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=124,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=648/500000]
+ train/ActionNoiseL2Loss=0.1294
+ throughput/total_tokens=124,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=649/500000]
+ train/ActionNoiseL2Loss=0.1857
+ throughput/total_tokens=124,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=650/500000]
+ train/ActionNoiseL2Loss=0.1520
+ throughput/total_tokens=124,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=651/500000]
+ train/ActionNoiseL2Loss=0.1183
+ throughput/total_tokens=124,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=652/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=125,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=653/500000]
+ train/ActionNoiseL2Loss=0.1100
+ throughput/total_tokens=125,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=654/500000]
+ train/ActionNoiseL2Loss=0.1716
+ throughput/total_tokens=125,568,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=655/500000]
+ train/ActionNoiseL2Loss=0.2059
+ throughput/total_tokens=125,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=656/500000]
+ train/ActionNoiseL2Loss=0.1489
+ throughput/total_tokens=125,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=657/500000]
+ train/ActionNoiseL2Loss=0.1164
+ throughput/total_tokens=126,144,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=658/500000]
+ train/ActionNoiseL2Loss=0.1687
+ throughput/total_tokens=126,336,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=659/500000]
+ train/ActionNoiseL2Loss=0.1418
+ throughput/total_tokens=126,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=660/500000]
+ optim/total_grad_norm=6.178
+ train/ActionNoiseL2Loss=0.2445
+ throughput/total_tokens=126,720,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=661/500000]
+ train/ActionNoiseL2Loss=0.2099
+ throughput/total_tokens=126,912,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=662/500000]
+ train/ActionNoiseL2Loss=0.1054
+ throughput/total_tokens=127,104,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=663/500000]
+ train/ActionNoiseL2Loss=0.1824
+ throughput/total_tokens=127,296,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=664/500000]
+ train/ActionNoiseL2Loss=0.2983
+ throughput/total_tokens=127,488,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=665/500000]
+ train/ActionNoiseL2Loss=0.1959
+ throughput/total_tokens=127,680,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=666/500000]
+ train/ActionNoiseL2Loss=0.1515
+ throughput/total_tokens=127,872,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=667/500000]
+ train/ActionNoiseL2Loss=0.2517
+ throughput/total_tokens=128,064,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=668/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=128,256,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=669/500000]
+ train/ActionNoiseL2Loss=0.1335
+ throughput/total_tokens=128,448,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=670/500000]
+ train/ActionNoiseL2Loss=0.2331
+ throughput/total_tokens=128,640,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=671/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=128,832,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=672/500000]
+ train/ActionNoiseL2Loss=0.1272
+ throughput/total_tokens=129,024,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=673/500000]
+ train/ActionNoiseL2Loss=0.1460
+ throughput/total_tokens=129,216,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=674/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=129,408,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=675/500000]
+ train/ActionNoiseL2Loss=0.2027
+ throughput/total_tokens=129,600,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=676/500000]
+ train/ActionNoiseL2Loss=0.1494
+ throughput/total_tokens=129,792,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=677/500000]
+ train/ActionNoiseL2Loss=0.1319
+ throughput/total_tokens=129,984,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=678/500000]
+ train/ActionNoiseL2Loss=0.1370
+ throughput/total_tokens=130,176,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=679/500000]
+ train/ActionNoiseL2Loss=0.1507
+ throughput/total_tokens=130,368,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=680/500000]
+ optim/total_grad_norm=6.025
+ train/ActionNoiseL2Loss=0.2513
+ throughput/total_tokens=130,560,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=681/500000]
+ train/ActionNoiseL2Loss=0.2364
+ throughput/total_tokens=130,752,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=682/500000]
+ train/ActionNoiseL2Loss=0.1648
+ throughput/total_tokens=130,944,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=683/500000]
+ train/ActionNoiseL2Loss=0.1339
+ throughput/total_tokens=131,136,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=684/500000]
+ train/ActionNoiseL2Loss=0.2476
+ throughput/total_tokens=131,328,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=685/500000]
+ train/ActionNoiseL2Loss=0.1807
+ throughput/total_tokens=131,520,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=686/500000]
+ train/ActionNoiseL2Loss=0.1312
+ throughput/total_tokens=131,712,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=687/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=131,904,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=688/500000]
+ train/ActionNoiseL2Loss=0.2140
+ throughput/total_tokens=132,096,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=689/500000]
+ train/ActionNoiseL2Loss=0.1742
+ throughput/total_tokens=132,288,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=690/500000]
+ train/ActionNoiseL2Loss=0.2331
+ throughput/total_tokens=132,480,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=691/500000]
+ train/ActionNoiseL2Loss=0.1283
+ throughput/total_tokens=132,672,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=692/500000]
+ train/ActionNoiseL2Loss=0.2269
+ throughput/total_tokens=132,864,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=693/500000]
+ train/ActionNoiseL2Loss=0.2216
+ throughput/total_tokens=133,056,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=694/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=133,248,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=695/500000]
+ train/ActionNoiseL2Loss=0.1244
+ throughput/total_tokens=133,440,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=696/500000]
+ train/ActionNoiseL2Loss=0.3078
+ throughput/total_tokens=133,632,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=697/500000]
+ train/ActionNoiseL2Loss=0.1628
+ throughput/total_tokens=133,824,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=698/500000]
+ train/ActionNoiseL2Loss=0.1296
+ throughput/total_tokens=134,016,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=699/500000]
+ train/ActionNoiseL2Loss=0.2231
+ throughput/total_tokens=134,208,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=700/500000]
+ optim/total_grad_norm=6.181
+ train/ActionNoiseL2Loss=0.1710
+ throughput/total_tokens=134,400,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=701/500000]
+ train/ActionNoiseL2Loss=0.1180
+ throughput/total_tokens=134,592,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=702/500000]
+ train/ActionNoiseL2Loss=0.1951
+ throughput/total_tokens=134,784,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=703/500000]
+ train/ActionNoiseL2Loss=0.1594
+ throughput/total_tokens=134,976,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=704/500000]
+ train/ActionNoiseL2Loss=0.1579
+ throughput/total_tokens=135,168,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=705/500000]
+ train/ActionNoiseL2Loss=0.1556
+ throughput/total_tokens=135,360,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=706/500000]
+ train/ActionNoiseL2Loss=0.1499
+ throughput/total_tokens=135,552,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=707/500000]
+ train/ActionNoiseL2Loss=0.1829
+ throughput/total_tokens=135,744,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=708/500000]
+ train/ActionNoiseL2Loss=0.1884
+ throughput/total_tokens=135,936,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=709/500000]
+ train/ActionNoiseL2Loss=0.1566
+ throughput/total_tokens=136,128,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=710/500000]
+ train/ActionNoiseL2Loss=0.1961
+ throughput/total_tokens=136,320,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=711/500000]
+ train/ActionNoiseL2Loss=0.1586
+ throughput/total_tokens=136,512,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=712/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=136,704,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=713/500000]
+ train/ActionNoiseL2Loss=0.1975
+ throughput/total_tokens=136,896,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=714/500000]
+ train/ActionNoiseL2Loss=0.1646
+ throughput/total_tokens=137,088,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=715/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=137,280,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=716/500000]
+ train/ActionNoiseL2Loss=0.1128
+ throughput/total_tokens=137,472,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=717/500000]
+ train/ActionNoiseL2Loss=0.1508
+ throughput/total_tokens=137,664,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=718/500000]
+ train/ActionNoiseL2Loss=0.1994
+ throughput/total_tokens=137,856,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=719/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=138,048,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=720/500000]
+ optim/total_grad_norm=4.220
+ train/ActionNoiseL2Loss=0.1789
+ throughput/total_tokens=138,240,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=721/500000]
+ train/ActionNoiseL2Loss=0.1691
+ throughput/total_tokens=138,432,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=722/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=138,624,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=723/500000]
+ train/ActionNoiseL2Loss=0.2311
+ throughput/total_tokens=138,816,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=724/500000]
+ train/ActionNoiseL2Loss=0.1484
+ throughput/total_tokens=139,008,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=725/500000]
+ train/ActionNoiseL2Loss=0.1250
+ throughput/total_tokens=139,200,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=726/500000]
+ train/ActionNoiseL2Loss=0.1350
+ throughput/total_tokens=139,392,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=727/500000]
+ train/ActionNoiseL2Loss=0.1819
+ throughput/total_tokens=139,584,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=728/500000]
+ train/ActionNoiseL2Loss=0.2038
+ throughput/total_tokens=139,776,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=729/500000]
+ train/ActionNoiseL2Loss=0.1839
+ throughput/total_tokens=139,968,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=730/500000]
+ train/ActionNoiseL2Loss=0.1267
+ throughput/total_tokens=140,160,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=731/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=140,352,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=732/500000]
+ train/ActionNoiseL2Loss=0.1382
+ throughput/total_tokens=140,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=733/500000]
+ train/ActionNoiseL2Loss=0.1876
+ throughput/total_tokens=140,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=734/500000]
+ train/ActionNoiseL2Loss=0.1875
+ throughput/total_tokens=140,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=735/500000]
+ train/ActionNoiseL2Loss=0.1221
+ throughput/total_tokens=141,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=736/500000]
+ train/ActionNoiseL2Loss=0.1232
+ throughput/total_tokens=141,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=737/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=141,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=738/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=141,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=739/500000]
+ train/ActionNoiseL2Loss=0.2031
+ throughput/total_tokens=141,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=740/500000]
+ optim/total_grad_norm=3.914
+ train/ActionNoiseL2Loss=0.1581
+ throughput/total_tokens=142,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=741/500000]
+ train/ActionNoiseL2Loss=0.2009
+ throughput/total_tokens=142,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=742/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=142,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=743/500000]
+ train/ActionNoiseL2Loss=0.1384
+ throughput/total_tokens=142,656,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=744/500000]
+ train/ActionNoiseL2Loss=0.1443
+ throughput/total_tokens=142,848,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=745/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=143,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=746/500000]
+ train/ActionNoiseL2Loss=0.1206
+ throughput/total_tokens=143,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=747/500000]
+ train/ActionNoiseL2Loss=0.1519
+ throughput/total_tokens=143,424,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=748/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=143,616,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=749/500000]
+ train/ActionNoiseL2Loss=0.1362
+ throughput/total_tokens=143,808,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=750/500000]
+ train/ActionNoiseL2Loss=0.1294
+ throughput/total_tokens=144,000,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=751/500000]
+ train/ActionNoiseL2Loss=0.1429
+ throughput/total_tokens=144,192,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=752/500000]
+ train/ActionNoiseL2Loss=0.1595
+ throughput/total_tokens=144,384,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=753/500000]
+ train/ActionNoiseL2Loss=0.1376
+ throughput/total_tokens=144,576,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=754/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=144,768,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=755/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=144,960,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=756/500000]
+ train/ActionNoiseL2Loss=0.1778
+ throughput/total_tokens=145,152,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=757/500000]
+ train/ActionNoiseL2Loss=0.1406
+ throughput/total_tokens=145,344,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=758/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=145,536,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=759/500000]
+ train/ActionNoiseL2Loss=0.1319
+ throughput/total_tokens=145,728,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=760/500000]
+ optim/total_grad_norm=8.067
+ train/ActionNoiseL2Loss=0.2923
+ throughput/total_tokens=145,920,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=761/500000]
+ train/ActionNoiseL2Loss=0.1200
+ throughput/total_tokens=146,112,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=762/500000]
+ train/ActionNoiseL2Loss=0.2418
+ throughput/total_tokens=146,304,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=763/500000]
+ train/ActionNoiseL2Loss=0.1653
+ throughput/total_tokens=146,496,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=764/500000]
+ train/ActionNoiseL2Loss=0.1580
+ throughput/total_tokens=146,688,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=765/500000]
+ train/ActionNoiseL2Loss=0.1504
+ throughput/total_tokens=146,880,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=766/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=147,072,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=767/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=147,264,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=768/500000]
+ train/ActionNoiseL2Loss=0.1509
+ throughput/total_tokens=147,456,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=769/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=147,648,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=770/500000]
+ train/ActionNoiseL2Loss=0.1663
+ throughput/total_tokens=147,840,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=771/500000]
+ train/ActionNoiseL2Loss=0.1460
+ throughput/total_tokens=148,032,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=772/500000]
+ train/ActionNoiseL2Loss=0.1029
+ throughput/total_tokens=148,224,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=773/500000]
+ train/ActionNoiseL2Loss=0.1395
+ throughput/total_tokens=148,416,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=774/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=148,608,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=775/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=148,800,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=776/500000]
+ train/ActionNoiseL2Loss=0.2376
+ throughput/total_tokens=148,992,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=777/500000]
+ train/ActionNoiseL2Loss=0.1664
+ throughput/total_tokens=149,184,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=778/500000]
+ train/ActionNoiseL2Loss=0.2315
+ throughput/total_tokens=149,376,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=779/500000]
+ train/ActionNoiseL2Loss=0.2131
+ throughput/total_tokens=149,568,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=780/500000]
+ optim/total_grad_norm=5.151
+ train/ActionNoiseL2Loss=0.1975
+ throughput/total_tokens=149,760,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=781/500000]
+ train/ActionNoiseL2Loss=0.1213
+ throughput/total_tokens=149,952,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=782/500000]
+ train/ActionNoiseL2Loss=0.2414
+ throughput/total_tokens=150,144,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=783/500000]
+ train/ActionNoiseL2Loss=0.1907
+ throughput/total_tokens=150,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=784/500000]
+ train/ActionNoiseL2Loss=0.1287
+ throughput/total_tokens=150,528,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=785/500000]
+ train/ActionNoiseL2Loss=0.0967
+ throughput/total_tokens=150,720,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=786/500000]
+ train/ActionNoiseL2Loss=0.1263
+ throughput/total_tokens=150,912,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=787/500000]
+ train/ActionNoiseL2Loss=0.2040
+ throughput/total_tokens=151,104,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=788/500000]
+ train/ActionNoiseL2Loss=0.1477
+ throughput/total_tokens=151,296,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=789/500000]
+ train/ActionNoiseL2Loss=0.1859
+ throughput/total_tokens=151,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=790/500000]
+ train/ActionNoiseL2Loss=0.1098
+ throughput/total_tokens=151,680,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=791/500000]
+ train/ActionNoiseL2Loss=0.1968
+ throughput/total_tokens=151,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=792/500000]
+ train/ActionNoiseL2Loss=0.1412
+ throughput/total_tokens=152,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=793/500000]
+ train/ActionNoiseL2Loss=0.1514
+ throughput/total_tokens=152,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=794/500000]
+ train/ActionNoiseL2Loss=0.2091
+ throughput/total_tokens=152,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=795/500000]
+ train/ActionNoiseL2Loss=0.1613
+ throughput/total_tokens=152,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=796/500000]
+ train/ActionNoiseL2Loss=0.2409
+ throughput/total_tokens=152,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=797/500000]
+ train/ActionNoiseL2Loss=0.1353
+ throughput/total_tokens=153,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=798/500000]
+ train/ActionNoiseL2Loss=0.1593
+ throughput/total_tokens=153,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=799/500000]
+ train/ActionNoiseL2Loss=0.1347
+ throughput/total_tokens=153,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=800/500000]
+ optim/total_grad_norm=4.708
+ train/ActionNoiseL2Loss=0.1221
+ throughput/total_tokens=153,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=801/500000]
+ train/ActionNoiseL2Loss=0.1790
+ throughput/total_tokens=153,792,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=802/500000]
+ train/ActionNoiseL2Loss=0.1341
+ throughput/total_tokens=153,984,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=803/500000]
+ train/ActionNoiseL2Loss=0.1322
+ throughput/total_tokens=154,176,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=804/500000]
+ train/ActionNoiseL2Loss=0.1247
+ throughput/total_tokens=154,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=805/500000]
+ train/ActionNoiseL2Loss=0.1459
+ throughput/total_tokens=154,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=806/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=154,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=807/500000]
+ train/ActionNoiseL2Loss=0.1308
+ throughput/total_tokens=154,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=808/500000]
+ train/ActionNoiseL2Loss=0.1150
+ throughput/total_tokens=155,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=809/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=155,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=810/500000]
+ train/ActionNoiseL2Loss=0.1346
+ throughput/total_tokens=155,520,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=811/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=155,712,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=812/500000]
+ train/ActionNoiseL2Loss=0.2035
+ throughput/total_tokens=155,904,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=813/500000]
+ train/ActionNoiseL2Loss=0.1711
+ throughput/total_tokens=156,096,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=814/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=156,288,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=815/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=156,480,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=816/500000]
+ train/ActionNoiseL2Loss=0.1960
+ throughput/total_tokens=156,672,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=817/500000]
+ train/ActionNoiseL2Loss=0.1780
+ throughput/total_tokens=156,864,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=818/500000]
+ train/ActionNoiseL2Loss=0.1791
+ throughput/total_tokens=157,056,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=819/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=157,248,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=820/500000]
+ optim/total_grad_norm=3.605
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=157,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=821/500000]
+ train/ActionNoiseL2Loss=0.1980
+ throughput/total_tokens=157,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=822/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=157,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=823/500000]
+ train/ActionNoiseL2Loss=0.1416
+ throughput/total_tokens=158,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=824/500000]
+ train/ActionNoiseL2Loss=0.1369
+ throughput/total_tokens=158,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=825/500000]
+ train/ActionNoiseL2Loss=0.1743
+ throughput/total_tokens=158,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=826/500000]
+ train/ActionNoiseL2Loss=0.1961
+ throughput/total_tokens=158,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=827/500000]
+ train/ActionNoiseL2Loss=0.1735
+ throughput/total_tokens=158,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=828/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=158,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=829/500000]
+ train/ActionNoiseL2Loss=0.1257
+ throughput/total_tokens=159,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=830/500000]
+ train/ActionNoiseL2Loss=0.1267
+ throughput/total_tokens=159,360,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=831/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=159,552,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=832/500000]
+ train/ActionNoiseL2Loss=0.1221
+ throughput/total_tokens=159,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=833/500000]
+ train/ActionNoiseL2Loss=0.1886
+ throughput/total_tokens=159,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=834/500000]
+ train/ActionNoiseL2Loss=0.2061
+ throughput/total_tokens=160,128,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=835/500000]
+ train/ActionNoiseL2Loss=0.1618
+ throughput/total_tokens=160,320,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=836/500000]
+ train/ActionNoiseL2Loss=0.1170
+ throughput/total_tokens=160,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=837/500000]
+ train/ActionNoiseL2Loss=0.1377
+ throughput/total_tokens=160,704,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=838/500000]
+ train/ActionNoiseL2Loss=0.1325
+ throughput/total_tokens=160,896,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=839/500000]
+ train/ActionNoiseL2Loss=0.1605
+ throughput/total_tokens=161,088,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=840/500000]
+ optim/total_grad_norm=3.912
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=161,280,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=841/500000]
+ train/ActionNoiseL2Loss=0.2021
+ throughput/total_tokens=161,472,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=842/500000]
+ train/ActionNoiseL2Loss=0.1430
+ throughput/total_tokens=161,664,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=843/500000]
+ train/ActionNoiseL2Loss=0.1304
+ throughput/total_tokens=161,856,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=844/500000]
+ train/ActionNoiseL2Loss=0.1667
+ throughput/total_tokens=162,048,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=845/500000]
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=162,240,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=846/500000]
+ train/ActionNoiseL2Loss=0.1403
+ throughput/total_tokens=162,432,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=847/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=162,624,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=848/500000]
+ train/ActionNoiseL2Loss=0.1631
+ throughput/total_tokens=162,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=849/500000]
+ train/ActionNoiseL2Loss=0.1888
+ throughput/total_tokens=163,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=850/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=163,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=851/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=163,392,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=852/500000]
+ train/ActionNoiseL2Loss=0.1882
+ throughput/total_tokens=163,584,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=853/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=163,776,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=854/500000]
+ train/ActionNoiseL2Loss=0.1448
+ throughput/total_tokens=163,968,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=855/500000]
+ train/ActionNoiseL2Loss=0.2379
+ throughput/total_tokens=164,160,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=856/500000]
+ train/ActionNoiseL2Loss=0.1600
+ throughput/total_tokens=164,352,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=857/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=164,544,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=858/500000]
+ train/ActionNoiseL2Loss=0.1298
+ throughput/total_tokens=164,736,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=859/500000]
+ train/ActionNoiseL2Loss=0.3540
+ throughput/total_tokens=164,928,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=860/500000]
+ optim/total_grad_norm=5.595
+ train/ActionNoiseL2Loss=0.2175
+ throughput/total_tokens=165,120,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=861/500000]
+ train/ActionNoiseL2Loss=0.2135
+ throughput/total_tokens=165,312,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=862/500000]
+ train/ActionNoiseL2Loss=0.1477
+ throughput/total_tokens=165,504,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=863/500000]
+ train/ActionNoiseL2Loss=0.2297
+ throughput/total_tokens=165,696,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=864/500000]
+ train/ActionNoiseL2Loss=0.1987
+ throughput/total_tokens=165,888,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=865/500000]
+ train/ActionNoiseL2Loss=0.1586
+ throughput/total_tokens=166,080,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=866/500000]
+ train/ActionNoiseL2Loss=0.3250
+ throughput/total_tokens=166,272,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=867/500000]
+ train/ActionNoiseL2Loss=0.1897
+ throughput/total_tokens=166,464,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=868/500000]
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=166,656,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=869/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=166,848,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=870/500000]
+ train/ActionNoiseL2Loss=0.1542
+ throughput/total_tokens=167,040,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=871/500000]
+ train/ActionNoiseL2Loss=0.1100
+ throughput/total_tokens=167,232,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=872/500000]
+ train/ActionNoiseL2Loss=0.2048
+ throughput/total_tokens=167,424,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=873/500000]
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=167,616,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=874/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=167,808,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=875/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=168,000,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=876/500000]
+ train/ActionNoiseL2Loss=0.1502
+ throughput/total_tokens=168,192,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=877/500000]
+ train/ActionNoiseL2Loss=0.1913
+ throughput/total_tokens=168,384,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=878/500000]
+ train/ActionNoiseL2Loss=0.1752
+ throughput/total_tokens=168,576,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=879/500000]
+ train/ActionNoiseL2Loss=0.1377
+ throughput/total_tokens=168,768,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=880/500000]
+ optim/total_grad_norm=4.807
+ train/ActionNoiseL2Loss=0.1414
+ throughput/total_tokens=168,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=881/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=169,152,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=882/500000]
+ train/ActionNoiseL2Loss=0.2085
+ throughput/total_tokens=169,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=883/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=169,536,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=884/500000]
+ train/ActionNoiseL2Loss=0.1098
+ throughput/total_tokens=169,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=885/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=169,920,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=886/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=170,112,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=887/500000]
+ train/ActionNoiseL2Loss=0.1520
+ throughput/total_tokens=170,304,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=888/500000]
+ train/ActionNoiseL2Loss=0.2218
+ throughput/total_tokens=170,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=889/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=170,688,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=890/500000]
+ train/ActionNoiseL2Loss=0.1395
+ throughput/total_tokens=170,880,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=891/500000]
+ train/ActionNoiseL2Loss=0.1755
+ throughput/total_tokens=171,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=892/500000]
+ train/ActionNoiseL2Loss=0.1425
+ throughput/total_tokens=171,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=893/500000]
+ train/ActionNoiseL2Loss=0.1228
+ throughput/total_tokens=171,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=894/500000]
+ train/ActionNoiseL2Loss=0.1104
+ throughput/total_tokens=171,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=895/500000]
+ train/ActionNoiseL2Loss=0.1596
+ throughput/total_tokens=171,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=896/500000]
+ train/ActionNoiseL2Loss=0.1370
+ throughput/total_tokens=172,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=897/500000]
+ train/ActionNoiseL2Loss=0.1583
+ throughput/total_tokens=172,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=898/500000]
+ train/ActionNoiseL2Loss=0.1100
+ throughput/total_tokens=172,416,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=899/500000]
+ train/ActionNoiseL2Loss=0.1440
+ throughput/total_tokens=172,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=900/500000]
+ optim/total_grad_norm=2.379
+ train/ActionNoiseL2Loss=0.1079
+ throughput/total_tokens=172,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=901/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=172,992,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=902/500000]
+ train/ActionNoiseL2Loss=0.1661
+ throughput/total_tokens=173,184,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=903/500000]
+ train/ActionNoiseL2Loss=0.1240
+ throughput/total_tokens=173,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=904/500000]
+ train/ActionNoiseL2Loss=0.1079
+ throughput/total_tokens=173,568,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=905/500000]
+ train/ActionNoiseL2Loss=0.1493
+ throughput/total_tokens=173,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=906/500000]
+ train/ActionNoiseL2Loss=0.1626
+ throughput/total_tokens=173,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=907/500000]
+ train/ActionNoiseL2Loss=0.1390
+ throughput/total_tokens=174,144,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=908/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=174,336,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=909/500000]
+ train/ActionNoiseL2Loss=0.1605
+ throughput/total_tokens=174,528,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=910/500000]
+ train/ActionNoiseL2Loss=0.1164
+ throughput/total_tokens=174,720,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=911/500000]
+ train/ActionNoiseL2Loss=0.1474
+ throughput/total_tokens=174,912,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=912/500000]
+ train/ActionNoiseL2Loss=0.1597
+ throughput/total_tokens=175,104,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=913/500000]
+ train/ActionNoiseL2Loss=0.1520
+ throughput/total_tokens=175,296,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=914/500000]
+ train/ActionNoiseL2Loss=0.1578
+ throughput/total_tokens=175,488,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=915/500000]
+ train/ActionNoiseL2Loss=0.1650
+ throughput/total_tokens=175,680,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=916/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=175,872,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=917/500000]
+ train/ActionNoiseL2Loss=0.1925
+ throughput/total_tokens=176,064,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=918/500000]
+ train/ActionNoiseL2Loss=0.1147
+ throughput/total_tokens=176,256,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=919/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=176,448,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=920/500000]
+ optim/total_grad_norm=4.888
+ train/ActionNoiseL2Loss=0.1578
+ throughput/total_tokens=176,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=921/500000]
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=176,832,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=922/500000]
+ train/ActionNoiseL2Loss=0.1477
+ throughput/total_tokens=177,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=923/500000]
+ train/ActionNoiseL2Loss=0.1664
+ throughput/total_tokens=177,216,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=924/500000]
+ train/ActionNoiseL2Loss=0.1205
+ throughput/total_tokens=177,408,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=925/500000]
+ train/ActionNoiseL2Loss=0.1311
+ throughput/total_tokens=177,600,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=926/500000]
+ train/ActionNoiseL2Loss=0.1631
+ throughput/total_tokens=177,792,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=927/500000]
+ train/ActionNoiseL2Loss=0.1704
+ throughput/total_tokens=177,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=928/500000]
+ train/ActionNoiseL2Loss=0.1272
+ throughput/total_tokens=178,176,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=929/500000]
+ train/ActionNoiseL2Loss=0.1747
+ throughput/total_tokens=178,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=930/500000]
+ train/ActionNoiseL2Loss=0.1871
+ throughput/total_tokens=178,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=931/500000]
+ train/ActionNoiseL2Loss=0.2440
+ throughput/total_tokens=178,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=932/500000]
+ train/ActionNoiseL2Loss=0.1260
+ throughput/total_tokens=178,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=933/500000]
+ train/ActionNoiseL2Loss=0.2380
+ throughput/total_tokens=179,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=934/500000]
+ train/ActionNoiseL2Loss=0.1784
+ throughput/total_tokens=179,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=935/500000]
+ train/ActionNoiseL2Loss=0.1663
+ throughput/total_tokens=179,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=936/500000]
+ train/ActionNoiseL2Loss=0.1480
+ throughput/total_tokens=179,712,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=937/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=179,904,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=938/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=180,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=939/500000]
+ train/ActionNoiseL2Loss=0.1299
+ throughput/total_tokens=180,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=940/500000]
+ optim/total_grad_norm=3.377
+ train/ActionNoiseL2Loss=0.1640
+ throughput/total_tokens=180,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=941/500000]
+ train/ActionNoiseL2Loss=0.1290
+ throughput/total_tokens=180,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=942/500000]
+ train/ActionNoiseL2Loss=0.2613
+ throughput/total_tokens=180,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=943/500000]
+ train/ActionNoiseL2Loss=0.1175
+ throughput/total_tokens=181,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=944/500000]
+ train/ActionNoiseL2Loss=0.1537
+ throughput/total_tokens=181,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=945/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=181,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=946/500000]
+ train/ActionNoiseL2Loss=0.1817
+ throughput/total_tokens=181,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=947/500000]
+ train/ActionNoiseL2Loss=0.1120
+ throughput/total_tokens=181,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=948/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=182,016,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=949/500000]
+ train/ActionNoiseL2Loss=0.1132
+ throughput/total_tokens=182,208,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=950/500000]
+ train/ActionNoiseL2Loss=0.1452
+ throughput/total_tokens=182,400,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=951/500000]
+ train/ActionNoiseL2Loss=0.1270
+ throughput/total_tokens=182,592,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=952/500000]
+ train/ActionNoiseL2Loss=0.1122
+ throughput/total_tokens=182,784,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=953/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=182,976,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=954/500000]
+ train/ActionNoiseL2Loss=0.1531
+ throughput/total_tokens=183,168,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=955/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=183,360,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=956/500000]
+ train/ActionNoiseL2Loss=0.2742
+ throughput/total_tokens=183,552,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=957/500000]
+ train/ActionNoiseL2Loss=0.1850
+ throughput/total_tokens=183,744,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=958/500000]
+ train/ActionNoiseL2Loss=0.2276
+ throughput/total_tokens=183,936,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=959/500000]
+ train/ActionNoiseL2Loss=0.1174
+ throughput/total_tokens=184,128,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=960/500000]
+ optim/total_grad_norm=3.597
+ train/ActionNoiseL2Loss=0.1547
+ throughput/total_tokens=184,320,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=961/500000]
+ train/ActionNoiseL2Loss=0.1500
+ throughput/total_tokens=184,512,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=962/500000]
+ train/ActionNoiseL2Loss=0.1239
+ throughput/total_tokens=184,704,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=963/500000]
+ train/ActionNoiseL2Loss=0.1200
+ throughput/total_tokens=184,896,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=964/500000]
+ train/ActionNoiseL2Loss=0.1675
+ throughput/total_tokens=185,088,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=965/500000]
+ train/ActionNoiseL2Loss=0.1815
+ throughput/total_tokens=185,280,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=966/500000]
+ train/ActionNoiseL2Loss=0.1332
+ throughput/total_tokens=185,472,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=967/500000]
+ train/ActionNoiseL2Loss=0.1923
+ throughput/total_tokens=185,664,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=968/500000]
+ train/ActionNoiseL2Loss=0.1858
+ throughput/total_tokens=185,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=969/500000]
+ train/ActionNoiseL2Loss=0.1661
+ throughput/total_tokens=186,048,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=970/500000]
+ train/ActionNoiseL2Loss=0.2107
+ throughput/total_tokens=186,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=971/500000]
+ train/ActionNoiseL2Loss=0.1424
+ throughput/total_tokens=186,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=972/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=186,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=973/500000]
+ train/ActionNoiseL2Loss=0.1198
+ throughput/total_tokens=186,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=974/500000]
+ train/ActionNoiseL2Loss=0.1933
+ throughput/total_tokens=187,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=975/500000]
+ train/ActionNoiseL2Loss=0.2020
+ throughput/total_tokens=187,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=976/500000]
+ train/ActionNoiseL2Loss=0.2004
+ throughput/total_tokens=187,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=977/500000]
+ train/ActionNoiseL2Loss=0.1478
+ throughput/total_tokens=187,584,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=978/500000]
+ train/ActionNoiseL2Loss=0.1682
+ throughput/total_tokens=187,776,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=979/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=187,968,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=980/500000]
+ optim/total_grad_norm=3.558
+ train/ActionNoiseL2Loss=0.1347
+ throughput/total_tokens=188,160,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=981/500000]
+ train/ActionNoiseL2Loss=0.1853
+ throughput/total_tokens=188,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=982/500000]
+ train/ActionNoiseL2Loss=0.1365
+ throughput/total_tokens=188,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=983/500000]
+ train/ActionNoiseL2Loss=0.1506
+ throughput/total_tokens=188,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=984/500000]
+ train/ActionNoiseL2Loss=0.1329
+ throughput/total_tokens=188,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=985/500000]
+ train/ActionNoiseL2Loss=0.1131
+ throughput/total_tokens=189,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=986/500000]
+ train/ActionNoiseL2Loss=0.1387
+ throughput/total_tokens=189,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=987/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=189,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=988/500000]
+ train/ActionNoiseL2Loss=0.1621
+ throughput/total_tokens=189,696,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=989/500000]
+ train/ActionNoiseL2Loss=0.1419
+ throughput/total_tokens=189,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=990/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=190,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=991/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=190,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=992/500000]
+ train/ActionNoiseL2Loss=0.1296
+ throughput/total_tokens=190,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=993/500000]
+ train/ActionNoiseL2Loss=0.1733
+ throughput/total_tokens=190,656,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=994/500000]
+ train/ActionNoiseL2Loss=0.2071
+ throughput/total_tokens=190,848,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=995/500000]
+ train/ActionNoiseL2Loss=0.1029
+ throughput/total_tokens=191,040,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=996/500000]
+ train/ActionNoiseL2Loss=0.2171
+ throughput/total_tokens=191,232,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=997/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=191,424,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=998/500000]
+ train/ActionNoiseL2Loss=0.1589
+ throughput/total_tokens=191,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=999/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=191,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1000/500000]
+ optim/total_grad_norm=5.347
+ train/ActionNoiseL2Loss=0.1843
+ throughput/total_tokens=192,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+10/11 [22:34:47] INFO | >> Saving config... checkpoint.py:608
+10/11 [22:35:21] INFO | >> Saving model state... checkpoint.py:796
+10/11 [22:36:27] INFO | >> Saving optim state... checkpoint.py:811
+10/11 [22:37:59] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=1001/500000]
+ train/ActionNoiseL2Loss=0.2418
+ throughput/total_tokens=192,192,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=1002/500000]
+ train/ActionNoiseL2Loss=0.1764
+ throughput/total_tokens=192,384,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=1003/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=192,576,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=1004/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=192,768,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=1005/500000]
+ train/ActionNoiseL2Loss=0.1332
+ throughput/total_tokens=192,960,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=1006/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=193,152,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=1007/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=193,344,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=1008/500000]
+ train/ActionNoiseL2Loss=0.1538
+ throughput/total_tokens=193,536,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=1009/500000]
+ train/ActionNoiseL2Loss=0.1449
+ throughput/total_tokens=193,728,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=1010/500000]
+ train/ActionNoiseL2Loss=0.1203
+ throughput/total_tokens=193,920,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+ System/Peak GPU Memory (MB)=51,073
+[step=1011/500000]
+ train/ActionNoiseL2Loss=0.1270
+ throughput/total_tokens=194,112,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=1012/500000]
+ train/ActionNoiseL2Loss=0.1754
+ throughput/total_tokens=194,304,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1013/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=194,496,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1014/500000]
+ train/ActionNoiseL2Loss=0.1760
+ throughput/total_tokens=194,688,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1015/500000]
+ train/ActionNoiseL2Loss=0.1758
+ throughput/total_tokens=194,880,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=1016/500000]
+ train/ActionNoiseL2Loss=0.1589
+ throughput/total_tokens=195,072,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=1017/500000]
+ train/ActionNoiseL2Loss=0.2122
+ throughput/total_tokens=195,264,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1018/500000]
+ train/ActionNoiseL2Loss=0.1293
+ throughput/total_tokens=195,456,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1019/500000]
+ train/ActionNoiseL2Loss=0.1548
+ throughput/total_tokens=195,648,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1020/500000]
+ optim/total_grad_norm=5.447
+ train/ActionNoiseL2Loss=0.1634
+ throughput/total_tokens=195,840,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=1021/500000]
+ train/ActionNoiseL2Loss=0.1506
+ throughput/total_tokens=196,032,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1022/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=196,224,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1023/500000]
+ train/ActionNoiseL2Loss=0.1088
+ throughput/total_tokens=196,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1024/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=196,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1025/500000]
+ train/ActionNoiseL2Loss=0.1524
+ throughput/total_tokens=196,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1026/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=196,992,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1027/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=197,184,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1028/500000]
+ train/ActionNoiseL2Loss=0.1887
+ throughput/total_tokens=197,376,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1029/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=197,568,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1030/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=197,760,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1031/500000]
+ train/ActionNoiseL2Loss=0.1495
+ throughput/total_tokens=197,952,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1032/500000]
+ train/ActionNoiseL2Loss=0.1437
+ throughput/total_tokens=198,144,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1033/500000]
+ train/ActionNoiseL2Loss=0.1635
+ throughput/total_tokens=198,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1034/500000]
+ train/ActionNoiseL2Loss=0.1420
+ throughput/total_tokens=198,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1035/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=198,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1036/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=198,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1037/500000]
+ train/ActionNoiseL2Loss=0.1394
+ throughput/total_tokens=199,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1038/500000]
+ train/ActionNoiseL2Loss=0.1388
+ throughput/total_tokens=199,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1039/500000]
+ train/ActionNoiseL2Loss=0.1225
+ throughput/total_tokens=199,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1040/500000]
+ optim/total_grad_norm=4.718
+ train/ActionNoiseL2Loss=0.1729
+ throughput/total_tokens=199,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1041/500000]
+ train/ActionNoiseL2Loss=0.1829
+ throughput/total_tokens=199,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1042/500000]
+ train/ActionNoiseL2Loss=0.1345
+ throughput/total_tokens=200,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1043/500000]
+ train/ActionNoiseL2Loss=0.1519
+ throughput/total_tokens=200,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1044/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=200,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1045/500000]
+ train/ActionNoiseL2Loss=0.1325
+ throughput/total_tokens=200,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1046/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=200,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1047/500000]
+ train/ActionNoiseL2Loss=0.1784
+ throughput/total_tokens=201,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1048/500000]
+ train/ActionNoiseL2Loss=0.1190
+ throughput/total_tokens=201,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1049/500000]
+ train/ActionNoiseL2Loss=0.1160
+ throughput/total_tokens=201,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1050/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=201,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1051/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=201,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1052/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=201,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1053/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=202,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1054/500000]
+ train/ActionNoiseL2Loss=0.1287
+ throughput/total_tokens=202,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1055/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=202,560,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1056/500000]
+ train/ActionNoiseL2Loss=0.1886
+ throughput/total_tokens=202,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1057/500000]
+ train/ActionNoiseL2Loss=0.1160
+ throughput/total_tokens=202,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1058/500000]
+ train/ActionNoiseL2Loss=0.1110
+ throughput/total_tokens=203,136,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1059/500000]
+ train/ActionNoiseL2Loss=0.1979
+ throughput/total_tokens=203,328,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1060/500000]
+ optim/total_grad_norm=3.181
+ train/ActionNoiseL2Loss=0.1605
+ throughput/total_tokens=203,520,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1061/500000]
+ train/ActionNoiseL2Loss=0.1198
+ throughput/total_tokens=203,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1062/500000]
+ train/ActionNoiseL2Loss=0.2076
+ throughput/total_tokens=203,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1063/500000]
+ train/ActionNoiseL2Loss=0.1488
+ throughput/total_tokens=204,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1064/500000]
+ train/ActionNoiseL2Loss=0.1333
+ throughput/total_tokens=204,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1065/500000]
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=204,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1066/500000]
+ train/ActionNoiseL2Loss=0.1196
+ throughput/total_tokens=204,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1067/500000]
+ train/ActionNoiseL2Loss=0.2383
+ throughput/total_tokens=204,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1068/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=205,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1069/500000]
+ train/ActionNoiseL2Loss=0.2033
+ throughput/total_tokens=205,248,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1070/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=205,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1071/500000]
+ train/ActionNoiseL2Loss=0.1281
+ throughput/total_tokens=205,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1072/500000]
+ train/ActionNoiseL2Loss=0.1133
+ throughput/total_tokens=205,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1073/500000]
+ train/ActionNoiseL2Loss=0.1155
+ throughput/total_tokens=206,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1074/500000]
+ train/ActionNoiseL2Loss=0.1399
+ throughput/total_tokens=206,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1075/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=206,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1076/500000]
+ train/ActionNoiseL2Loss=0.1480
+ throughput/total_tokens=206,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1077/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=206,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1078/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=206,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1079/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=207,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1080/500000]
+ optim/total_grad_norm=3.465
+ train/ActionNoiseL2Loss=0.1764
+ throughput/total_tokens=207,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1081/500000]
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=207,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1082/500000]
+ train/ActionNoiseL2Loss=0.1453
+ throughput/total_tokens=207,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1083/500000]
+ train/ActionNoiseL2Loss=0.1741
+ throughput/total_tokens=207,936,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1084/500000]
+ train/ActionNoiseL2Loss=0.1673
+ throughput/total_tokens=208,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1085/500000]
+ train/ActionNoiseL2Loss=0.1270
+ throughput/total_tokens=208,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1086/500000]
+ train/ActionNoiseL2Loss=0.1664
+ throughput/total_tokens=208,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1087/500000]
+ train/ActionNoiseL2Loss=0.1411
+ throughput/total_tokens=208,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1088/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=208,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1089/500000]
+ train/ActionNoiseL2Loss=0.1518
+ throughput/total_tokens=209,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1090/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=209,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1091/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=209,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1092/500000]
+ train/ActionNoiseL2Loss=0.1193
+ throughput/total_tokens=209,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1093/500000]
+ train/ActionNoiseL2Loss=0.1692
+ throughput/total_tokens=209,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1094/500000]
+ train/ActionNoiseL2Loss=0.1771
+ throughput/total_tokens=210,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1095/500000]
+ train/ActionNoiseL2Loss=0.1821
+ throughput/total_tokens=210,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1096/500000]
+ train/ActionNoiseL2Loss=0.1307
+ throughput/total_tokens=210,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1097/500000]
+ train/ActionNoiseL2Loss=0.1408
+ throughput/total_tokens=210,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1098/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=210,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1099/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=211,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1100/500000]
+ optim/total_grad_norm=2.192
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=211,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1101/500000]
+ train/ActionNoiseL2Loss=0.1491
+ throughput/total_tokens=211,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1102/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=211,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1103/500000]
+ train/ActionNoiseL2Loss=0.1616
+ throughput/total_tokens=211,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1104/500000]
+ train/ActionNoiseL2Loss=0.1270
+ throughput/total_tokens=211,968,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1105/500000]
+ train/ActionNoiseL2Loss=0.1239
+ throughput/total_tokens=212,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1106/500000]
+ train/ActionNoiseL2Loss=0.2511
+ throughput/total_tokens=212,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1107/500000]
+ train/ActionNoiseL2Loss=0.1699
+ throughput/total_tokens=212,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1108/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=212,736,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1109/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=212,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1110/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=213,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1111/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=213,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1112/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=213,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1113/500000]
+ train/ActionNoiseL2Loss=0.1242
+ throughput/total_tokens=213,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1114/500000]
+ train/ActionNoiseL2Loss=0.1368
+ throughput/total_tokens=213,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1115/500000]
+ train/ActionNoiseL2Loss=0.1635
+ throughput/total_tokens=214,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1116/500000]
+ train/ActionNoiseL2Loss=0.2225
+ throughput/total_tokens=214,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1117/500000]
+ train/ActionNoiseL2Loss=0.1361
+ throughput/total_tokens=214,464,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1118/500000]
+ train/ActionNoiseL2Loss=0.1760
+ throughput/total_tokens=214,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1119/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=214,848,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1120/500000]
+ optim/total_grad_norm=3.384
+ train/ActionNoiseL2Loss=0.1344
+ throughput/total_tokens=215,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1121/500000]
+ train/ActionNoiseL2Loss=0.1515
+ throughput/total_tokens=215,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1122/500000]
+ train/ActionNoiseL2Loss=0.1341
+ throughput/total_tokens=215,424,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1123/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=215,616,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1124/500000]
+ train/ActionNoiseL2Loss=0.2833
+ throughput/total_tokens=215,808,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1125/500000]
+ train/ActionNoiseL2Loss=0.1236
+ throughput/total_tokens=216,000,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1126/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=216,192,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1127/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=216,384,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1128/500000]
+ train/ActionNoiseL2Loss=0.1317
+ throughput/total_tokens=216,576,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1129/500000]
+ train/ActionNoiseL2Loss=0.1287
+ throughput/total_tokens=216,768,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1130/500000]
+ train/ActionNoiseL2Loss=0.1630
+ throughput/total_tokens=216,960,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1131/500000]
+ train/ActionNoiseL2Loss=0.2172
+ throughput/total_tokens=217,152,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1132/500000]
+ train/ActionNoiseL2Loss=0.1194
+ throughput/total_tokens=217,344,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1133/500000]
+ train/ActionNoiseL2Loss=0.1378
+ throughput/total_tokens=217,536,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1134/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=217,728,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1135/500000]
+ train/ActionNoiseL2Loss=0.1252
+ throughput/total_tokens=217,920,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1136/500000]
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=218,112,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1137/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=218,304,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1138/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=218,496,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1139/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=218,688,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1140/500000]
+ optim/total_grad_norm=5.340
+ train/ActionNoiseL2Loss=0.2553
+ throughput/total_tokens=218,880,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1141/500000]
+ train/ActionNoiseL2Loss=0.2928
+ throughput/total_tokens=219,072,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1142/500000]
+ train/ActionNoiseL2Loss=0.1513
+ throughput/total_tokens=219,264,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1143/500000]
+ train/ActionNoiseL2Loss=0.1878
+ throughput/total_tokens=219,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1144/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=219,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1145/500000]
+ train/ActionNoiseL2Loss=0.2140
+ throughput/total_tokens=219,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1146/500000]
+ train/ActionNoiseL2Loss=0.2253
+ throughput/total_tokens=220,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1147/500000]
+ train/ActionNoiseL2Loss=0.2222
+ throughput/total_tokens=220,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1148/500000]
+ train/ActionNoiseL2Loss=0.1737
+ throughput/total_tokens=220,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1149/500000]
+ train/ActionNoiseL2Loss=0.1986
+ throughput/total_tokens=220,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1150/500000]
+ train/ActionNoiseL2Loss=0.1382
+ throughput/total_tokens=220,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1151/500000]
+ train/ActionNoiseL2Loss=0.1571
+ throughput/total_tokens=220,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1152/500000]
+ train/ActionNoiseL2Loss=0.1020
+ throughput/total_tokens=221,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1153/500000]
+ train/ActionNoiseL2Loss=0.1686
+ throughput/total_tokens=221,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1154/500000]
+ train/ActionNoiseL2Loss=0.1325
+ throughput/total_tokens=221,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1155/500000]
+ train/ActionNoiseL2Loss=0.1841
+ throughput/total_tokens=221,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1156/500000]
+ train/ActionNoiseL2Loss=0.2585
+ throughput/total_tokens=221,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1157/500000]
+ train/ActionNoiseL2Loss=0.2310
+ throughput/total_tokens=222,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1158/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=222,336,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1159/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=222,528,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1160/500000]
+ optim/total_grad_norm=2.761
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=222,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1161/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=222,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1162/500000]
+ train/ActionNoiseL2Loss=0.1815
+ throughput/total_tokens=223,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1163/500000]
+ train/ActionNoiseL2Loss=0.1334
+ throughput/total_tokens=223,296,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1164/500000]
+ train/ActionNoiseL2Loss=0.1137
+ throughput/total_tokens=223,488,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1165/500000]
+ train/ActionNoiseL2Loss=0.1583
+ throughput/total_tokens=223,680,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1166/500000]
+ train/ActionNoiseL2Loss=0.1475
+ throughput/total_tokens=223,872,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1167/500000]
+ train/ActionNoiseL2Loss=0.2635
+ throughput/total_tokens=224,064,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1168/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=224,256,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1169/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=224,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1170/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=224,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1171/500000]
+ train/ActionNoiseL2Loss=0.3400
+ throughput/total_tokens=224,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1172/500000]
+ train/ActionNoiseL2Loss=0.1273
+ throughput/total_tokens=225,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1173/500000]
+ train/ActionNoiseL2Loss=0.1522
+ throughput/total_tokens=225,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1174/500000]
+ train/ActionNoiseL2Loss=0.2013
+ throughput/total_tokens=225,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1175/500000]
+ train/ActionNoiseL2Loss=0.1593
+ throughput/total_tokens=225,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1176/500000]
+ train/ActionNoiseL2Loss=0.1432
+ throughput/total_tokens=225,792,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1177/500000]
+ train/ActionNoiseL2Loss=0.1312
+ throughput/total_tokens=225,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1178/500000]
+ train/ActionNoiseL2Loss=0.1325
+ throughput/total_tokens=226,176,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1179/500000]
+ train/ActionNoiseL2Loss=0.1667
+ throughput/total_tokens=226,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1180/500000]
+ optim/total_grad_norm=3.219
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=226,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1181/500000]
+ train/ActionNoiseL2Loss=0.1428
+ throughput/total_tokens=226,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1182/500000]
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=226,944,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1183/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=227,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1184/500000]
+ train/ActionNoiseL2Loss=0.1242
+ throughput/total_tokens=227,328,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1185/500000]
+ train/ActionNoiseL2Loss=0.1171
+ throughput/total_tokens=227,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1186/500000]
+ train/ActionNoiseL2Loss=0.2159
+ throughput/total_tokens=227,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1187/500000]
+ train/ActionNoiseL2Loss=0.2451
+ throughput/total_tokens=227,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1188/500000]
+ train/ActionNoiseL2Loss=0.2176
+ throughput/total_tokens=228,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1189/500000]
+ train/ActionNoiseL2Loss=0.1693
+ throughput/total_tokens=228,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1190/500000]
+ train/ActionNoiseL2Loss=0.1250
+ throughput/total_tokens=228,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1191/500000]
+ train/ActionNoiseL2Loss=0.1474
+ throughput/total_tokens=228,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1192/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=228,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1193/500000]
+ train/ActionNoiseL2Loss=0.1236
+ throughput/total_tokens=229,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1194/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=229,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1195/500000]
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=229,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1196/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=229,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1197/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=229,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1198/500000]
+ train/ActionNoiseL2Loss=0.1543
+ throughput/total_tokens=230,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1199/500000]
+ train/ActionNoiseL2Loss=0.1471
+ throughput/total_tokens=230,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1200/500000]
+ optim/total_grad_norm=3.015
+ train/ActionNoiseL2Loss=0.1246
+ throughput/total_tokens=230,400,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,073
+[step=1201/500000]
+ train/ActionNoiseL2Loss=0.1366
+ throughput/total_tokens=230,592,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1202/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=230,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1203/500000]
+ train/ActionNoiseL2Loss=0.1102
+ throughput/total_tokens=230,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1204/500000]
+ train/ActionNoiseL2Loss=0.1746
+ throughput/total_tokens=231,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1205/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=231,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1206/500000]
+ train/ActionNoiseL2Loss=0.1582
+ throughput/total_tokens=231,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1207/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=231,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1208/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=231,936,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1209/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=232,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1210/500000]
+ train/ActionNoiseL2Loss=0.1437
+ throughput/total_tokens=232,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1211/500000]
+ train/ActionNoiseL2Loss=0.2255
+ throughput/total_tokens=232,512,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1212/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=232,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1213/500000]
+ train/ActionNoiseL2Loss=0.1846
+ throughput/total_tokens=232,896,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1214/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=233,088,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1215/500000]
+ train/ActionNoiseL2Loss=0.2033
+ throughput/total_tokens=233,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1216/500000]
+ train/ActionNoiseL2Loss=0.1976
+ throughput/total_tokens=233,472,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1217/500000]
+ train/ActionNoiseL2Loss=0.1170
+ throughput/total_tokens=233,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1218/500000]
+ train/ActionNoiseL2Loss=0.1721
+ throughput/total_tokens=233,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1219/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=234,048,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1220/500000]
+ optim/total_grad_norm=2.294
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=234,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1221/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=234,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1222/500000]
+ train/ActionNoiseL2Loss=0.2085
+ throughput/total_tokens=234,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1223/500000]
+ train/ActionNoiseL2Loss=0.1448
+ throughput/total_tokens=234,816,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1224/500000]
+ train/ActionNoiseL2Loss=0.1450
+ throughput/total_tokens=235,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1225/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=235,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1226/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=235,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1227/500000]
+ train/ActionNoiseL2Loss=0.1681
+ throughput/total_tokens=235,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1228/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=235,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1229/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=235,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1230/500000]
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=236,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1231/500000]
+ train/ActionNoiseL2Loss=0.1563
+ throughput/total_tokens=236,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1232/500000]
+ train/ActionNoiseL2Loss=0.1821
+ throughput/total_tokens=236,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1233/500000]
+ train/ActionNoiseL2Loss=0.1488
+ throughput/total_tokens=236,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1234/500000]
+ train/ActionNoiseL2Loss=0.2152
+ throughput/total_tokens=236,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1235/500000]
+ train/ActionNoiseL2Loss=0.1340
+ throughput/total_tokens=237,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1236/500000]
+ train/ActionNoiseL2Loss=0.2159
+ throughput/total_tokens=237,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1237/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=237,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1238/500000]
+ train/ActionNoiseL2Loss=0.1209
+ throughput/total_tokens=237,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1239/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=237,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1240/500000]
+ optim/total_grad_norm=4.241
+ train/ActionNoiseL2Loss=0.1546
+ throughput/total_tokens=238,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1241/500000]
+ train/ActionNoiseL2Loss=0.1348
+ throughput/total_tokens=238,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1242/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=238,464,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1243/500000]
+ train/ActionNoiseL2Loss=0.1719
+ throughput/total_tokens=238,656,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1244/500000]
+ train/ActionNoiseL2Loss=0.1687
+ throughput/total_tokens=238,848,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1245/500000]
+ train/ActionNoiseL2Loss=0.1353
+ throughput/total_tokens=239,040,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1246/500000]
+ train/ActionNoiseL2Loss=0.1623
+ throughput/total_tokens=239,232,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1247/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=239,424,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1248/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=239,616,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1249/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=239,808,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1250/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=240,000,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1251/500000]
+ train/ActionNoiseL2Loss=0.1549
+ throughput/total_tokens=240,192,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1252/500000]
+ train/ActionNoiseL2Loss=0.1202
+ throughput/total_tokens=240,384,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1253/500000]
+ train/ActionNoiseL2Loss=0.1413
+ throughput/total_tokens=240,576,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1254/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=240,768,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1255/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=240,960,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1256/500000]
+ train/ActionNoiseL2Loss=0.1418
+ throughput/total_tokens=241,152,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1257/500000]
+ train/ActionNoiseL2Loss=0.1453
+ throughput/total_tokens=241,344,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1258/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=241,536,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1259/500000]
+ train/ActionNoiseL2Loss=0.1206
+ throughput/total_tokens=241,728,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1260/500000]
+ optim/total_grad_norm=3.371
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=241,920,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=1261/500000]
+ train/ActionNoiseL2Loss=0.1518
+ throughput/total_tokens=242,112,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1262/500000]
+ train/ActionNoiseL2Loss=0.1809
+ throughput/total_tokens=242,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1263/500000]
+ train/ActionNoiseL2Loss=0.1276
+ throughput/total_tokens=242,496,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1264/500000]
+ train/ActionNoiseL2Loss=0.1088
+ throughput/total_tokens=242,688,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1265/500000]
+ train/ActionNoiseL2Loss=0.1340
+ throughput/total_tokens=242,880,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1266/500000]
+ train/ActionNoiseL2Loss=0.1308
+ throughput/total_tokens=243,072,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1267/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=243,264,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1268/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=243,456,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1269/500000]
+ train/ActionNoiseL2Loss=0.1753
+ throughput/total_tokens=243,648,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1270/500000]
+ train/ActionNoiseL2Loss=0.1858
+ throughput/total_tokens=243,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1271/500000]
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=244,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1272/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=244,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1273/500000]
+ train/ActionNoiseL2Loss=0.1461
+ throughput/total_tokens=244,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1274/500000]
+ train/ActionNoiseL2Loss=0.1874
+ throughput/total_tokens=244,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1275/500000]
+ train/ActionNoiseL2Loss=0.1219
+ throughput/total_tokens=244,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1276/500000]
+ train/ActionNoiseL2Loss=0.1699
+ throughput/total_tokens=244,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1277/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=245,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1278/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=245,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1279/500000]
+ train/ActionNoiseL2Loss=0.1779
+ throughput/total_tokens=245,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1280/500000]
+ optim/total_grad_norm=2.632
+ train/ActionNoiseL2Loss=0.1271
+ throughput/total_tokens=245,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1281/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=245,952,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1282/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=246,144,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1283/500000]
+ train/ActionNoiseL2Loss=0.1201
+ throughput/total_tokens=246,336,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1284/500000]
+ train/ActionNoiseL2Loss=0.1476
+ throughput/total_tokens=246,528,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1285/500000]
+ train/ActionNoiseL2Loss=0.1248
+ throughput/total_tokens=246,720,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1286/500000]
+ train/ActionNoiseL2Loss=0.1692
+ throughput/total_tokens=246,912,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1287/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=247,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1288/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=247,296,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1289/500000]
+ train/ActionNoiseL2Loss=0.1236
+ throughput/total_tokens=247,488,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1290/500000]
+ train/ActionNoiseL2Loss=0.1662
+ throughput/total_tokens=247,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1291/500000]
+ train/ActionNoiseL2Loss=0.2090
+ throughput/total_tokens=247,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1292/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=248,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1293/500000]
+ train/ActionNoiseL2Loss=0.1910
+ throughput/total_tokens=248,256,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1294/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=248,448,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1295/500000]
+ train/ActionNoiseL2Loss=0.1676
+ throughput/total_tokens=248,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1296/500000]
+ train/ActionNoiseL2Loss=0.1971
+ throughput/total_tokens=248,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1297/500000]
+ train/ActionNoiseL2Loss=0.1401
+ throughput/total_tokens=249,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1298/500000]
+ train/ActionNoiseL2Loss=0.1825
+ throughput/total_tokens=249,216,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1299/500000]
+ train/ActionNoiseL2Loss=0.1435
+ throughput/total_tokens=249,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1300/500000]
+ optim/total_grad_norm=2.137
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=249,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1301/500000]
+ train/ActionNoiseL2Loss=0.1292
+ throughput/total_tokens=249,792,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1302/500000]
+ train/ActionNoiseL2Loss=0.1238
+ throughput/total_tokens=249,984,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1303/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=250,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1304/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=250,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1305/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=250,560,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1306/500000]
+ train/ActionNoiseL2Loss=0.1122
+ throughput/total_tokens=250,752,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1307/500000]
+ train/ActionNoiseL2Loss=0.1146
+ throughput/total_tokens=250,944,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1308/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=251,136,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1309/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=251,328,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1310/500000]
+ train/ActionNoiseL2Loss=0.1229
+ throughput/total_tokens=251,520,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=1311/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=251,712,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1312/500000]
+ train/ActionNoiseL2Loss=0.1351
+ throughput/total_tokens=251,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1313/500000]
+ train/ActionNoiseL2Loss=0.1179
+ throughput/total_tokens=252,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1314/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=252,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1315/500000]
+ train/ActionNoiseL2Loss=0.1346
+ throughput/total_tokens=252,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1316/500000]
+ train/ActionNoiseL2Loss=0.1167
+ throughput/total_tokens=252,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1317/500000]
+ train/ActionNoiseL2Loss=0.1179
+ throughput/total_tokens=252,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1318/500000]
+ train/ActionNoiseL2Loss=0.1628
+ throughput/total_tokens=253,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1319/500000]
+ train/ActionNoiseL2Loss=0.1833
+ throughput/total_tokens=253,248,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1320/500000]
+ optim/total_grad_norm=3.496
+ train/ActionNoiseL2Loss=0.1769
+ throughput/total_tokens=253,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1321/500000]
+ train/ActionNoiseL2Loss=0.1728
+ throughput/total_tokens=253,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1322/500000]
+ train/ActionNoiseL2Loss=0.0976
+ throughput/total_tokens=253,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1323/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=254,016,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1324/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=254,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1325/500000]
+ train/ActionNoiseL2Loss=0.1346
+ throughput/total_tokens=254,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1326/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=254,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1327/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=254,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1328/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=254,976,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1329/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=255,168,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1330/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=255,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1331/500000]
+ train/ActionNoiseL2Loss=0.1648
+ throughput/total_tokens=255,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1332/500000]
+ train/ActionNoiseL2Loss=0.1320
+ throughput/total_tokens=255,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1333/500000]
+ train/ActionNoiseL2Loss=0.1855
+ throughput/total_tokens=255,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1334/500000]
+ train/ActionNoiseL2Loss=0.1586
+ throughput/total_tokens=256,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1335/500000]
+ train/ActionNoiseL2Loss=0.1453
+ throughput/total_tokens=256,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1336/500000]
+ train/ActionNoiseL2Loss=0.1385
+ throughput/total_tokens=256,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1337/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=256,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1338/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=256,896,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1339/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=257,088,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1340/500000]
+ optim/total_grad_norm=2.078
+ train/ActionNoiseL2Loss=0.1342
+ throughput/total_tokens=257,280,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1341/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=257,472,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1342/500000]
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=257,664,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1343/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=257,856,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1344/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=258,048,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1345/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=258,240,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1346/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=258,432,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1347/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=258,624,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1348/500000]
+ train/ActionNoiseL2Loss=0.2649
+ throughput/total_tokens=258,816,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1349/500000]
+ train/ActionNoiseL2Loss=0.1796
+ throughput/total_tokens=259,008,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1350/500000]
+ train/ActionNoiseL2Loss=0.1355
+ throughput/total_tokens=259,200,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1351/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=259,392,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=1352/500000]
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=259,584,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1353/500000]
+ train/ActionNoiseL2Loss=0.1250
+ throughput/total_tokens=259,776,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1354/500000]
+ train/ActionNoiseL2Loss=0.2186
+ throughput/total_tokens=259,968,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=1355/500000]
+ train/ActionNoiseL2Loss=0.1544
+ throughput/total_tokens=260,160,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=1356/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=260,352,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=1357/500000]
+ train/ActionNoiseL2Loss=0.1358
+ throughput/total_tokens=260,544,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1358/500000]
+ train/ActionNoiseL2Loss=0.1959
+ throughput/total_tokens=260,736,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1359/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=260,928,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1360/500000]
+ optim/total_grad_norm=3.035
+ train/ActionNoiseL2Loss=0.1203
+ throughput/total_tokens=261,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1361/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=261,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1362/500000]
+ train/ActionNoiseL2Loss=0.1653
+ throughput/total_tokens=261,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1363/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=261,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1364/500000]
+ train/ActionNoiseL2Loss=0.1572
+ throughput/total_tokens=261,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1365/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=262,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1366/500000]
+ train/ActionNoiseL2Loss=0.1345
+ throughput/total_tokens=262,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1367/500000]
+ train/ActionNoiseL2Loss=0.1510
+ throughput/total_tokens=262,464,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1368/500000]
+ train/ActionNoiseL2Loss=0.1194
+ throughput/total_tokens=262,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1369/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=262,848,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1370/500000]
+ train/ActionNoiseL2Loss=0.2792
+ throughput/total_tokens=263,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1371/500000]
+ train/ActionNoiseL2Loss=0.1357
+ throughput/total_tokens=263,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1372/500000]
+ train/ActionNoiseL2Loss=0.2167
+ throughput/total_tokens=263,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1373/500000]
+ train/ActionNoiseL2Loss=0.1784
+ throughput/total_tokens=263,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1374/500000]
+ train/ActionNoiseL2Loss=0.1758
+ throughput/total_tokens=263,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1375/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=264,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1376/500000]
+ train/ActionNoiseL2Loss=0.1449
+ throughput/total_tokens=264,192,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1377/500000]
+ train/ActionNoiseL2Loss=0.1330
+ throughput/total_tokens=264,384,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1378/500000]
+ train/ActionNoiseL2Loss=0.1599
+ throughput/total_tokens=264,576,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1379/500000]
+ train/ActionNoiseL2Loss=0.1828
+ throughput/total_tokens=264,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1380/500000]
+ optim/total_grad_norm=3.128
+ train/ActionNoiseL2Loss=0.1257
+ throughput/total_tokens=264,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1381/500000]
+ train/ActionNoiseL2Loss=0.1912
+ throughput/total_tokens=265,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1382/500000]
+ train/ActionNoiseL2Loss=0.2555
+ throughput/total_tokens=265,344,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1383/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=265,536,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1384/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=265,728,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1385/500000]
+ train/ActionNoiseL2Loss=0.1313
+ throughput/total_tokens=265,920,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1386/500000]
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=266,112,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1387/500000]
+ train/ActionNoiseL2Loss=0.1595
+ throughput/total_tokens=266,304,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1388/500000]
+ train/ActionNoiseL2Loss=0.1639
+ throughput/total_tokens=266,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1389/500000]
+ train/ActionNoiseL2Loss=0.1616
+ throughput/total_tokens=266,688,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1390/500000]
+ train/ActionNoiseL2Loss=0.1595
+ throughput/total_tokens=266,880,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1391/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=267,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1392/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=267,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1393/500000]
+ train/ActionNoiseL2Loss=0.1557
+ throughput/total_tokens=267,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1394/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=267,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1395/500000]
+ train/ActionNoiseL2Loss=0.1267
+ throughput/total_tokens=267,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1396/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=268,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1397/500000]
+ train/ActionNoiseL2Loss=0.1092
+ throughput/total_tokens=268,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1398/500000]
+ train/ActionNoiseL2Loss=0.1038
+ throughput/total_tokens=268,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1399/500000]
+ train/ActionNoiseL2Loss=0.1782
+ throughput/total_tokens=268,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1400/500000]
+ optim/total_grad_norm=2.258
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=268,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1401/500000]
+ train/ActionNoiseL2Loss=0.1344
+ throughput/total_tokens=268,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1402/500000]
+ train/ActionNoiseL2Loss=0.1466
+ throughput/total_tokens=269,184,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1403/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=269,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1404/500000]
+ train/ActionNoiseL2Loss=0.1600
+ throughput/total_tokens=269,568,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1405/500000]
+ train/ActionNoiseL2Loss=0.1439
+ throughput/total_tokens=269,760,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1406/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=269,952,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1407/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=270,144,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1408/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=270,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1409/500000]
+ train/ActionNoiseL2Loss=0.1337
+ throughput/total_tokens=270,528,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1410/500000]
+ train/ActionNoiseL2Loss=0.1837
+ throughput/total_tokens=270,720,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1411/500000]
+ train/ActionNoiseL2Loss=0.1361
+ throughput/total_tokens=270,912,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1412/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=271,104,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1413/500000]
+ train/ActionNoiseL2Loss=0.2411
+ throughput/total_tokens=271,296,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1414/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=271,488,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1415/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=271,680,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1416/500000]
+ train/ActionNoiseL2Loss=0.1606
+ throughput/total_tokens=271,872,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1417/500000]
+ train/ActionNoiseL2Loss=0.1220
+ throughput/total_tokens=272,064,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1418/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=272,256,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1419/500000]
+ train/ActionNoiseL2Loss=0.2011
+ throughput/total_tokens=272,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1420/500000]
+ optim/total_grad_norm=2.742
+ train/ActionNoiseL2Loss=0.1438
+ throughput/total_tokens=272,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1421/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=272,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1422/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=273,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1423/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=273,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1424/500000]
+ train/ActionNoiseL2Loss=0.2135
+ throughput/total_tokens=273,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1425/500000]
+ train/ActionNoiseL2Loss=0.1635
+ throughput/total_tokens=273,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1426/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=273,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1427/500000]
+ train/ActionNoiseL2Loss=0.1349
+ throughput/total_tokens=273,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1428/500000]
+ train/ActionNoiseL2Loss=0.1426
+ throughput/total_tokens=274,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1429/500000]
+ train/ActionNoiseL2Loss=0.1410
+ throughput/total_tokens=274,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1430/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=274,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1431/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=274,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1432/500000]
+ train/ActionNoiseL2Loss=0.1585
+ throughput/total_tokens=274,944,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1433/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=275,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1434/500000]
+ train/ActionNoiseL2Loss=0.1248
+ throughput/total_tokens=275,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1435/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=275,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1436/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=275,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1437/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=275,904,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1438/500000]
+ train/ActionNoiseL2Loss=0.1438
+ throughput/total_tokens=276,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1439/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=276,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1440/500000]
+ optim/total_grad_norm=2.720
+ train/ActionNoiseL2Loss=0.1184
+ throughput/total_tokens=276,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1441/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=276,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1442/500000]
+ train/ActionNoiseL2Loss=0.1665
+ throughput/total_tokens=276,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1443/500000]
+ train/ActionNoiseL2Loss=0.1312
+ throughput/total_tokens=277,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1444/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=277,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1445/500000]
+ train/ActionNoiseL2Loss=0.1281
+ throughput/total_tokens=277,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1446/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=277,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1447/500000]
+ train/ActionNoiseL2Loss=0.1546
+ throughput/total_tokens=277,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1448/500000]
+ train/ActionNoiseL2Loss=0.1286
+ throughput/total_tokens=278,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1449/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=278,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1450/500000]
+ train/ActionNoiseL2Loss=0.1180
+ throughput/total_tokens=278,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1451/500000]
+ train/ActionNoiseL2Loss=0.2060
+ throughput/total_tokens=278,592,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1452/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=278,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1453/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=278,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1454/500000]
+ train/ActionNoiseL2Loss=0.2114
+ throughput/total_tokens=279,168,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1455/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=279,360,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1456/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=279,552,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1457/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=279,744,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1458/500000]
+ train/ActionNoiseL2Loss=0.1199
+ throughput/total_tokens=279,936,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1459/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=280,128,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1460/500000]
+ optim/total_grad_norm=3.788
+ train/ActionNoiseL2Loss=0.1497
+ throughput/total_tokens=280,320,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=1461/500000]
+ train/ActionNoiseL2Loss=0.1646
+ throughput/total_tokens=280,512,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1462/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=280,704,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1463/500000]
+ train/ActionNoiseL2Loss=0.1041
+ throughput/total_tokens=280,896,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1464/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=281,088,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1465/500000]
+ train/ActionNoiseL2Loss=0.1534
+ throughput/total_tokens=281,280,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1466/500000]
+ train/ActionNoiseL2Loss=0.1109
+ throughput/total_tokens=281,472,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1467/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=281,664,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1468/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=281,856,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1469/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=282,048,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1470/500000]
+ train/ActionNoiseL2Loss=0.1112
+ throughput/total_tokens=282,240,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1471/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=282,432,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1472/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=282,624,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1473/500000]
+ train/ActionNoiseL2Loss=0.1559
+ throughput/total_tokens=282,816,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1474/500000]
+ train/ActionNoiseL2Loss=0.1562
+ throughput/total_tokens=283,008,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1475/500000]
+ train/ActionNoiseL2Loss=0.1098
+ throughput/total_tokens=283,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1476/500000]
+ train/ActionNoiseL2Loss=0.1737
+ throughput/total_tokens=283,392,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1477/500000]
+ train/ActionNoiseL2Loss=0.1634
+ throughput/total_tokens=283,584,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1478/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=283,776,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1479/500000]
+ train/ActionNoiseL2Loss=0.1100
+ throughput/total_tokens=283,968,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1480/500000]
+ optim/total_grad_norm=2.306
+ train/ActionNoiseL2Loss=0.1248
+ throughput/total_tokens=284,160,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1481/500000]
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=284,352,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1482/500000]
+ train/ActionNoiseL2Loss=0.1511
+ throughput/total_tokens=284,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1483/500000]
+ train/ActionNoiseL2Loss=0.1923
+ throughput/total_tokens=284,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1484/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=284,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1485/500000]
+ train/ActionNoiseL2Loss=0.1359
+ throughput/total_tokens=285,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1486/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=285,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1487/500000]
+ train/ActionNoiseL2Loss=0.1421
+ throughput/total_tokens=285,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1488/500000]
+ train/ActionNoiseL2Loss=0.1639
+ throughput/total_tokens=285,696,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1489/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=285,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1490/500000]
+ train/ActionNoiseL2Loss=0.1230
+ throughput/total_tokens=286,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1491/500000]
+ train/ActionNoiseL2Loss=0.1116
+ throughput/total_tokens=286,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1492/500000]
+ train/ActionNoiseL2Loss=0.1159
+ throughput/total_tokens=286,464,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1493/500000]
+ train/ActionNoiseL2Loss=0.1366
+ throughput/total_tokens=286,656,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1494/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=286,848,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1495/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=287,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1496/500000]
+ train/ActionNoiseL2Loss=0.1538
+ throughput/total_tokens=287,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1497/500000]
+ train/ActionNoiseL2Loss=0.1265
+ throughput/total_tokens=287,424,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1498/500000]
+ train/ActionNoiseL2Loss=0.2052
+ throughput/total_tokens=287,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1499/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=287,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1500/500000]
+ optim/total_grad_norm=3.919
+ train/ActionNoiseL2Loss=0.1599
+ throughput/total_tokens=288,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+10/12 [01:33:26] INFO | >> Saving config... checkpoint.py:608
+10/12 [01:34:00] INFO | >> Saving model state... checkpoint.py:796
+10/12 [01:35:16] INFO | >> Saving optim state... checkpoint.py:811
+10/12 [01:36:47] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=1501/500000]
+ train/ActionNoiseL2Loss=0.1646
+ throughput/total_tokens=288,192,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=1502/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=288,384,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=1503/500000]
+ train/ActionNoiseL2Loss=0.2414
+ throughput/total_tokens=288,576,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1504/500000]
+ train/ActionNoiseL2Loss=0.2179
+ throughput/total_tokens=288,768,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1505/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=288,960,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1506/500000]
+ train/ActionNoiseL2Loss=0.2166
+ throughput/total_tokens=289,152,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1507/500000]
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=289,344,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1508/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=289,536,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1509/500000]
+ train/ActionNoiseL2Loss=0.1684
+ throughput/total_tokens=289,728,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1510/500000]
+ train/ActionNoiseL2Loss=0.1927
+ throughput/total_tokens=289,920,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1511/500000]
+ train/ActionNoiseL2Loss=0.1127
+ throughput/total_tokens=290,112,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1512/500000]
+ train/ActionNoiseL2Loss=0.1346
+ throughput/total_tokens=290,304,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1513/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=290,496,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1514/500000]
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=290,688,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1515/500000]
+ train/ActionNoiseL2Loss=0.1692
+ throughput/total_tokens=290,880,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1516/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=291,072,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1517/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=291,264,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1518/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=291,456,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1519/500000]
+ train/ActionNoiseL2Loss=0.1552
+ throughput/total_tokens=291,648,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1520/500000]
+ optim/total_grad_norm=2.118
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=291,840,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1521/500000]
+ train/ActionNoiseL2Loss=0.1478
+ throughput/total_tokens=292,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1522/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=292,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1523/500000]
+ train/ActionNoiseL2Loss=0.1315
+ throughput/total_tokens=292,416,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1524/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=292,608,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1525/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=292,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1526/500000]
+ train/ActionNoiseL2Loss=0.1620
+ throughput/total_tokens=292,992,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1527/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=293,184,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1528/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=293,376,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1529/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=293,568,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1530/500000]
+ train/ActionNoiseL2Loss=0.1249
+ throughput/total_tokens=293,760,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1531/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=293,952,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1532/500000]
+ train/ActionNoiseL2Loss=0.1924
+ throughput/total_tokens=294,144,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1533/500000]
+ train/ActionNoiseL2Loss=0.1387
+ throughput/total_tokens=294,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1534/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=294,528,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1535/500000]
+ train/ActionNoiseL2Loss=0.1460
+ throughput/total_tokens=294,720,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1536/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=294,912,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1537/500000]
+ train/ActionNoiseL2Loss=0.1137
+ throughput/total_tokens=295,104,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1538/500000]
+ train/ActionNoiseL2Loss=0.1594
+ throughput/total_tokens=295,296,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1539/500000]
+ train/ActionNoiseL2Loss=0.1167
+ throughput/total_tokens=295,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1540/500000]
+ optim/total_grad_norm=2.189
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=295,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1541/500000]
+ train/ActionNoiseL2Loss=0.1304
+ throughput/total_tokens=295,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1542/500000]
+ train/ActionNoiseL2Loss=0.1287
+ throughput/total_tokens=296,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1543/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=296,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1544/500000]
+ train/ActionNoiseL2Loss=0.1472
+ throughput/total_tokens=296,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1545/500000]
+ train/ActionNoiseL2Loss=0.1373
+ throughput/total_tokens=296,640,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1546/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=296,832,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1547/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=297,024,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1548/500000]
+ train/ActionNoiseL2Loss=0.1289
+ throughput/total_tokens=297,216,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1549/500000]
+ train/ActionNoiseL2Loss=0.1544
+ throughput/total_tokens=297,408,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1550/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=297,600,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1551/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=297,792,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1552/500000]
+ train/ActionNoiseL2Loss=0.1404
+ throughput/total_tokens=297,984,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1553/500000]
+ train/ActionNoiseL2Loss=0.1414
+ throughput/total_tokens=298,176,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1554/500000]
+ train/ActionNoiseL2Loss=0.1506
+ throughput/total_tokens=298,368,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=1555/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=298,560,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=1556/500000]
+ train/ActionNoiseL2Loss=0.1338
+ throughput/total_tokens=298,752,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=1557/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=298,944,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1558/500000]
+ train/ActionNoiseL2Loss=0.1122
+ throughput/total_tokens=299,136,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1559/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=299,328,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1560/500000]
+ optim/total_grad_norm=2.006
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=299,520,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=1561/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=299,712,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1562/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=299,904,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=1563/500000]
+ train/ActionNoiseL2Loss=0.1136
+ throughput/total_tokens=300,096,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=1564/500000]
+ train/ActionNoiseL2Loss=0.1305
+ throughput/total_tokens=300,288,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=1565/500000]
+ train/ActionNoiseL2Loss=0.1424
+ throughput/total_tokens=300,480,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1566/500000]
+ train/ActionNoiseL2Loss=0.1387
+ throughput/total_tokens=300,672,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1567/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=300,864,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1568/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=301,056,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1569/500000]
+ train/ActionNoiseL2Loss=0.1902
+ throughput/total_tokens=301,248,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1570/500000]
+ train/ActionNoiseL2Loss=0.1757
+ throughput/total_tokens=301,440,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1571/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=301,632,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1572/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=301,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1573/500000]
+ train/ActionNoiseL2Loss=0.1236
+ throughput/total_tokens=302,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1574/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=302,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1575/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=302,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1576/500000]
+ train/ActionNoiseL2Loss=0.1630
+ throughput/total_tokens=302,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1577/500000]
+ train/ActionNoiseL2Loss=0.1474
+ throughput/total_tokens=302,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1578/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=302,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1579/500000]
+ train/ActionNoiseL2Loss=0.1842
+ throughput/total_tokens=303,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1580/500000]
+ optim/total_grad_norm=2.877
+ train/ActionNoiseL2Loss=0.1270
+ throughput/total_tokens=303,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1581/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=303,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1582/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=303,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1583/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=303,936,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1584/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=304,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1585/500000]
+ train/ActionNoiseL2Loss=0.1426
+ throughput/total_tokens=304,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1586/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=304,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1587/500000]
+ train/ActionNoiseL2Loss=0.1150
+ throughput/total_tokens=304,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1588/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=304,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1589/500000]
+ train/ActionNoiseL2Loss=0.1349
+ throughput/total_tokens=305,088,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1590/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=305,280,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1591/500000]
+ train/ActionNoiseL2Loss=0.1396
+ throughput/total_tokens=305,472,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1592/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=305,664,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1593/500000]
+ train/ActionNoiseL2Loss=0.1317
+ throughput/total_tokens=305,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1594/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=306,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1595/500000]
+ train/ActionNoiseL2Loss=0.1704
+ throughput/total_tokens=306,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1596/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=306,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1597/500000]
+ train/ActionNoiseL2Loss=0.1175
+ throughput/total_tokens=306,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1598/500000]
+ train/ActionNoiseL2Loss=0.1080
+ throughput/total_tokens=306,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1599/500000]
+ train/ActionNoiseL2Loss=0.2017
+ throughput/total_tokens=307,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1600/500000]
+ optim/total_grad_norm=4.006
+ train/ActionNoiseL2Loss=0.1397
+ throughput/total_tokens=307,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1601/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=307,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1602/500000]
+ train/ActionNoiseL2Loss=0.1303
+ throughput/total_tokens=307,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1603/500000]
+ train/ActionNoiseL2Loss=0.1319
+ throughput/total_tokens=307,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1604/500000]
+ train/ActionNoiseL2Loss=0.1514
+ throughput/total_tokens=307,968,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1605/500000]
+ train/ActionNoiseL2Loss=0.1088
+ throughput/total_tokens=308,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1606/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=308,352,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1607/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=308,544,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1608/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=308,736,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1609/500000]
+ train/ActionNoiseL2Loss=0.1146
+ throughput/total_tokens=308,928,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1610/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=309,120,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1611/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=309,312,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1612/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=309,504,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1613/500000]
+ train/ActionNoiseL2Loss=0.1338
+ throughput/total_tokens=309,696,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1614/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=309,888,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1615/500000]
+ train/ActionNoiseL2Loss=0.1289
+ throughput/total_tokens=310,080,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1616/500000]
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=310,272,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1617/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=310,464,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1618/500000]
+ train/ActionNoiseL2Loss=0.1026
+ throughput/total_tokens=310,656,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1619/500000]
+ train/ActionNoiseL2Loss=0.1303
+ throughput/total_tokens=310,848,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1620/500000]
+ optim/total_grad_norm=2.095
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=311,040,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,073
+[step=1621/500000]
+ train/ActionNoiseL2Loss=0.1732
+ throughput/total_tokens=311,232,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1622/500000]
+ train/ActionNoiseL2Loss=0.1278
+ throughput/total_tokens=311,424,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1623/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=311,616,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1624/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=311,808,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1625/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=312,000,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1626/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=312,192,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1627/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=312,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1628/500000]
+ train/ActionNoiseL2Loss=0.2029
+ throughput/total_tokens=312,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1629/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=312,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1630/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=312,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,073
+[step=1631/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=313,152,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1632/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=313,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1633/500000]
+ train/ActionNoiseL2Loss=0.1326
+ throughput/total_tokens=313,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1634/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=313,728,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1635/500000]
+ train/ActionNoiseL2Loss=0.1473
+ throughput/total_tokens=313,920,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1636/500000]
+ train/ActionNoiseL2Loss=0.1515
+ throughput/total_tokens=314,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1637/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=314,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1638/500000]
+ train/ActionNoiseL2Loss=0.2118
+ throughput/total_tokens=314,496,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1639/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=314,688,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1640/500000]
+ optim/total_grad_norm=2.660
+ train/ActionNoiseL2Loss=0.1487
+ throughput/total_tokens=314,880,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,073
+[step=1641/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=315,072,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1642/500000]
+ train/ActionNoiseL2Loss=0.2021
+ throughput/total_tokens=315,264,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1643/500000]
+ train/ActionNoiseL2Loss=0.1099
+ throughput/total_tokens=315,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1644/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=315,648,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1645/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=315,840,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1646/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=316,032,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1647/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=316,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1648/500000]
+ train/ActionNoiseL2Loss=0.1576
+ throughput/total_tokens=316,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1649/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=316,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1650/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=316,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1651/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=316,992,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1652/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=317,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1653/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=317,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1654/500000]
+ train/ActionNoiseL2Loss=0.1131
+ throughput/total_tokens=317,568,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1655/500000]
+ train/ActionNoiseL2Loss=0.1376
+ throughput/total_tokens=317,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1656/500000]
+ train/ActionNoiseL2Loss=0.1691
+ throughput/total_tokens=317,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1657/500000]
+ train/ActionNoiseL2Loss=0.1190
+ throughput/total_tokens=318,144,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1658/500000]
+ train/ActionNoiseL2Loss=0.1428
+ throughput/total_tokens=318,336,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1659/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=318,528,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1660/500000]
+ optim/total_grad_norm=2.157
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=318,720,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,073
+[step=1661/500000]
+ train/ActionNoiseL2Loss=0.1793
+ throughput/total_tokens=318,912,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1662/500000]
+ train/ActionNoiseL2Loss=0.1213
+ throughput/total_tokens=319,104,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1663/500000]
+ train/ActionNoiseL2Loss=0.1730
+ throughput/total_tokens=319,296,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1664/500000]
+ train/ActionNoiseL2Loss=0.1886
+ throughput/total_tokens=319,488,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1665/500000]
+ train/ActionNoiseL2Loss=0.1079
+ throughput/total_tokens=319,680,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1666/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=319,872,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1667/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=320,064,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1668/500000]
+ train/ActionNoiseL2Loss=0.1366
+ throughput/total_tokens=320,256,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1669/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=320,448,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1670/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=320,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1671/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=320,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1672/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=321,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1673/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=321,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1674/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=321,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1675/500000]
+ train/ActionNoiseL2Loss=0.1422
+ throughput/total_tokens=321,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1676/500000]
+ train/ActionNoiseL2Loss=0.1706
+ throughput/total_tokens=321,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1677/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=321,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1678/500000]
+ train/ActionNoiseL2Loss=0.1242
+ throughput/total_tokens=322,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1679/500000]
+ train/ActionNoiseL2Loss=0.1428
+ throughput/total_tokens=322,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1680/500000]
+ optim/total_grad_norm=1.943
+ train/ActionNoiseL2Loss=0.1293
+ throughput/total_tokens=322,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,073
+[step=1681/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=322,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1682/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=322,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1683/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=323,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1684/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=323,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1685/500000]
+ train/ActionNoiseL2Loss=0.1654
+ throughput/total_tokens=323,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1686/500000]
+ train/ActionNoiseL2Loss=0.1263
+ throughput/total_tokens=323,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1687/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=323,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1688/500000]
+ train/ActionNoiseL2Loss=0.1692
+ throughput/total_tokens=324,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1689/500000]
+ train/ActionNoiseL2Loss=0.1625
+ throughput/total_tokens=324,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1690/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=324,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1691/500000]
+ train/ActionNoiseL2Loss=0.1503
+ throughput/total_tokens=324,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1692/500000]
+ train/ActionNoiseL2Loss=0.1275
+ throughput/total_tokens=324,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1693/500000]
+ train/ActionNoiseL2Loss=0.1465
+ throughput/total_tokens=325,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1694/500000]
+ train/ActionNoiseL2Loss=0.1280
+ throughput/total_tokens=325,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1695/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=325,440,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1696/500000]
+ train/ActionNoiseL2Loss=0.1234
+ throughput/total_tokens=325,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1697/500000]
+ train/ActionNoiseL2Loss=0.1757
+ throughput/total_tokens=325,824,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1698/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=326,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1699/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=326,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1700/500000]
+ optim/total_grad_norm=3.400
+ train/ActionNoiseL2Loss=0.1421
+ throughput/total_tokens=326,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1701/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=326,592,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0475
+[step=1702/500000]
+ train/ActionNoiseL2Loss=0.1244
+ throughput/total_tokens=326,784,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0475
+[step=1703/500000]
+ train/ActionNoiseL2Loss=0.1413
+ throughput/total_tokens=326,976,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=1704/500000]
+ train/ActionNoiseL2Loss=0.1640
+ throughput/total_tokens=327,168,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=1705/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=327,360,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=1706/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=327,552,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=1707/500000]
+ train/ActionNoiseL2Loss=0.1438
+ throughput/total_tokens=327,744,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=1708/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=327,936,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=1709/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=328,128,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=1710/500000]
+ train/ActionNoiseL2Loss=0.1387
+ throughput/total_tokens=328,320,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+ System/Peak GPU Memory (MB)=51,073
+[step=1711/500000]
+ train/ActionNoiseL2Loss=0.1639
+ throughput/total_tokens=328,512,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=1712/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=328,704,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=1713/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=328,896,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=1714/500000]
+ train/ActionNoiseL2Loss=0.2330
+ throughput/total_tokens=329,088,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=1715/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=329,280,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=1716/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=329,472,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=1717/500000]
+ train/ActionNoiseL2Loss=0.1312
+ throughput/total_tokens=329,664,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=1718/500000]
+ train/ActionNoiseL2Loss=0.1159
+ throughput/total_tokens=329,856,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=1719/500000]
+ train/ActionNoiseL2Loss=0.1302
+ throughput/total_tokens=330,048,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=1720/500000]
+ optim/total_grad_norm=3.619
+ train/ActionNoiseL2Loss=0.1873
+ throughput/total_tokens=330,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1721/500000]
+ train/ActionNoiseL2Loss=0.1398
+ throughput/total_tokens=330,432,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1722/500000]
+ train/ActionNoiseL2Loss=0.1155
+ throughput/total_tokens=330,624,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1723/500000]
+ train/ActionNoiseL2Loss=0.1288
+ throughput/total_tokens=330,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1724/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=331,008,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1725/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=331,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1726/500000]
+ train/ActionNoiseL2Loss=0.1217
+ throughput/total_tokens=331,392,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1727/500000]
+ train/ActionNoiseL2Loss=0.1388
+ throughput/total_tokens=331,584,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1728/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=331,776,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1729/500000]
+ train/ActionNoiseL2Loss=0.1295
+ throughput/total_tokens=331,968,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1730/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=332,160,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1731/500000]
+ train/ActionNoiseL2Loss=0.1203
+ throughput/total_tokens=332,352,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1732/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=332,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1733/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=332,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1734/500000]
+ train/ActionNoiseL2Loss=0.0956
+ throughput/total_tokens=332,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1735/500000]
+ train/ActionNoiseL2Loss=0.1455
+ throughput/total_tokens=333,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1736/500000]
+ train/ActionNoiseL2Loss=0.1080
+ throughput/total_tokens=333,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1737/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=333,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1738/500000]
+ train/ActionNoiseL2Loss=0.1812
+ throughput/total_tokens=333,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1739/500000]
+ train/ActionNoiseL2Loss=0.1199
+ throughput/total_tokens=333,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1740/500000]
+ optim/total_grad_norm=1.986
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=334,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1741/500000]
+ train/ActionNoiseL2Loss=0.1496
+ throughput/total_tokens=334,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1742/500000]
+ train/ActionNoiseL2Loss=0.1261
+ throughput/total_tokens=334,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1743/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=334,656,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1744/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=334,848,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1745/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=335,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1746/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=335,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1747/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=335,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1748/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=335,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1749/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=335,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1750/500000]
+ train/ActionNoiseL2Loss=0.2077
+ throughput/total_tokens=336,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1751/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=336,192,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1752/500000]
+ train/ActionNoiseL2Loss=0.1202
+ throughput/total_tokens=336,384,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1753/500000]
+ train/ActionNoiseL2Loss=0.1155
+ throughput/total_tokens=336,576,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1754/500000]
+ train/ActionNoiseL2Loss=0.1671
+ throughput/total_tokens=336,768,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1755/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=336,960,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1756/500000]
+ train/ActionNoiseL2Loss=0.1635
+ throughput/total_tokens=337,152,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1757/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=337,344,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1758/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=337,536,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1759/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=337,728,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1760/500000]
+ optim/total_grad_norm=1.550
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=337,920,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1761/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=338,112,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1762/500000]
+ train/ActionNoiseL2Loss=0.1419
+ throughput/total_tokens=338,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1763/500000]
+ train/ActionNoiseL2Loss=0.1643
+ throughput/total_tokens=338,496,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1764/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=338,688,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1765/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=338,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1766/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=339,072,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1767/500000]
+ train/ActionNoiseL2Loss=0.1171
+ throughput/total_tokens=339,264,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1768/500000]
+ train/ActionNoiseL2Loss=0.1309
+ throughput/total_tokens=339,456,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1769/500000]
+ train/ActionNoiseL2Loss=0.1092
+ throughput/total_tokens=339,648,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1770/500000]
+ train/ActionNoiseL2Loss=0.1312
+ throughput/total_tokens=339,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1771/500000]
+ train/ActionNoiseL2Loss=0.1100
+ throughput/total_tokens=340,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1772/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=340,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1773/500000]
+ train/ActionNoiseL2Loss=0.2229
+ throughput/total_tokens=340,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1774/500000]
+ train/ActionNoiseL2Loss=0.1665
+ throughput/total_tokens=340,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1775/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=340,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1776/500000]
+ train/ActionNoiseL2Loss=0.0976
+ throughput/total_tokens=340,992,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1777/500000]
+ train/ActionNoiseL2Loss=0.1155
+ throughput/total_tokens=341,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1778/500000]
+ train/ActionNoiseL2Loss=0.1587
+ throughput/total_tokens=341,376,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1779/500000]
+ train/ActionNoiseL2Loss=0.2274
+ throughput/total_tokens=341,568,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1780/500000]
+ optim/total_grad_norm=2.185
+ train/ActionNoiseL2Loss=0.1360
+ throughput/total_tokens=341,760,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1781/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=341,952,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1782/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=342,144,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1783/500000]
+ train/ActionNoiseL2Loss=0.1914
+ throughput/total_tokens=342,336,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1784/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=342,528,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1785/500000]
+ train/ActionNoiseL2Loss=0.2020
+ throughput/total_tokens=342,720,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1786/500000]
+ train/ActionNoiseL2Loss=0.0998
+ throughput/total_tokens=342,912,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1787/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=343,104,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1788/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=343,296,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1789/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=343,488,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1790/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=343,680,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1791/500000]
+ train/ActionNoiseL2Loss=0.1294
+ throughput/total_tokens=343,872,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1792/500000]
+ train/ActionNoiseL2Loss=0.1285
+ throughput/total_tokens=344,064,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1793/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=344,256,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1794/500000]
+ train/ActionNoiseL2Loss=0.1205
+ throughput/total_tokens=344,448,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1795/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=344,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1796/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=344,832,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1797/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=345,024,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1798/500000]
+ train/ActionNoiseL2Loss=0.1237
+ throughput/total_tokens=345,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1799/500000]
+ train/ActionNoiseL2Loss=0.1209
+ throughput/total_tokens=345,408,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1800/500000]
+ optim/total_grad_norm=2.166
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=345,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1801/500000]
+ train/ActionNoiseL2Loss=0.1454
+ throughput/total_tokens=345,792,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1802/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=345,984,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1803/500000]
+ train/ActionNoiseL2Loss=0.1062
+ throughput/total_tokens=346,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1804/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=346,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1805/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=346,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1806/500000]
+ train/ActionNoiseL2Loss=0.1275
+ throughput/total_tokens=346,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1807/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=346,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1808/500000]
+ train/ActionNoiseL2Loss=0.1105
+ throughput/total_tokens=347,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1809/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=347,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1810/500000]
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=347,520,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1811/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=347,712,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=1812/500000]
+ train/ActionNoiseL2Loss=0.1442
+ throughput/total_tokens=347,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1813/500000]
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=348,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1814/500000]
+ train/ActionNoiseL2Loss=0.1671
+ throughput/total_tokens=348,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1815/500000]
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=348,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1816/500000]
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=348,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1817/500000]
+ train/ActionNoiseL2Loss=0.1186
+ throughput/total_tokens=348,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1818/500000]
+ train/ActionNoiseL2Loss=0.1195
+ throughput/total_tokens=349,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1819/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=349,248,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1820/500000]
+ optim/total_grad_norm=3.376
+ train/ActionNoiseL2Loss=0.1663
+ throughput/total_tokens=349,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1821/500000]
+ train/ActionNoiseL2Loss=0.1774
+ throughput/total_tokens=349,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1822/500000]
+ train/ActionNoiseL2Loss=0.1235
+ throughput/total_tokens=349,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1823/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=350,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1824/500000]
+ train/ActionNoiseL2Loss=0.1412
+ throughput/total_tokens=350,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1825/500000]
+ train/ActionNoiseL2Loss=0.1512
+ throughput/total_tokens=350,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1826/500000]
+ train/ActionNoiseL2Loss=0.2179
+ throughput/total_tokens=350,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1827/500000]
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=350,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1828/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=350,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1829/500000]
+ train/ActionNoiseL2Loss=0.1267
+ throughput/total_tokens=351,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1830/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=351,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1831/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=351,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1832/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=351,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1833/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=351,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1834/500000]
+ train/ActionNoiseL2Loss=0.1782
+ throughput/total_tokens=352,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1835/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=352,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1836/500000]
+ train/ActionNoiseL2Loss=0.1440
+ throughput/total_tokens=352,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1837/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=352,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1838/500000]
+ train/ActionNoiseL2Loss=0.1354
+ throughput/total_tokens=352,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1839/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=353,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1840/500000]
+ optim/total_grad_norm=2.808
+ train/ActionNoiseL2Loss=0.1676
+ throughput/total_tokens=353,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1841/500000]
+ train/ActionNoiseL2Loss=0.1322
+ throughput/total_tokens=353,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1842/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=353,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1843/500000]
+ train/ActionNoiseL2Loss=0.1180
+ throughput/total_tokens=353,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1844/500000]
+ train/ActionNoiseL2Loss=0.2318
+ throughput/total_tokens=354,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1845/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=354,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1846/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=354,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1847/500000]
+ train/ActionNoiseL2Loss=0.1301
+ throughput/total_tokens=354,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1848/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=354,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1849/500000]
+ train/ActionNoiseL2Loss=0.1429
+ throughput/total_tokens=355,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1850/500000]
+ train/ActionNoiseL2Loss=0.1857
+ throughput/total_tokens=355,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1851/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=355,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1852/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=355,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1853/500000]
+ train/ActionNoiseL2Loss=0.1261
+ throughput/total_tokens=355,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1854/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=355,968,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1855/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=356,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1856/500000]
+ train/ActionNoiseL2Loss=0.1474
+ throughput/total_tokens=356,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1857/500000]
+ train/ActionNoiseL2Loss=0.1796
+ throughput/total_tokens=356,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1858/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=356,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1859/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=356,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1860/500000]
+ optim/total_grad_norm=3.451
+ train/ActionNoiseL2Loss=0.1860
+ throughput/total_tokens=357,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1861/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=357,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1862/500000]
+ train/ActionNoiseL2Loss=0.1648
+ throughput/total_tokens=357,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=1863/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=357,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1864/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=357,888,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1865/500000]
+ train/ActionNoiseL2Loss=0.1384
+ throughput/total_tokens=358,080,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1866/500000]
+ train/ActionNoiseL2Loss=0.1932
+ throughput/total_tokens=358,272,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1867/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=358,464,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1868/500000]
+ train/ActionNoiseL2Loss=0.1217
+ throughput/total_tokens=358,656,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1869/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=358,848,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=1870/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=359,040,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,073
+[step=1871/500000]
+ train/ActionNoiseL2Loss=0.1596
+ throughput/total_tokens=359,232,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1872/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=359,424,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1873/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=359,616,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1874/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=359,808,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1875/500000]
+ train/ActionNoiseL2Loss=0.1217
+ throughput/total_tokens=360,000,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=1876/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=360,192,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=1877/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=360,384,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=1878/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=360,576,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=1879/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=360,768,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1880/500000]
+ optim/total_grad_norm=1.768
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=360,960,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,073
+[step=1881/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=361,152,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1882/500000]
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=361,344,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1883/500000]
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=361,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1884/500000]
+ train/ActionNoiseL2Loss=0.1293
+ throughput/total_tokens=361,728,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=1885/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=361,920,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1886/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=362,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=1887/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=362,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1888/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=362,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1889/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=362,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1890/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=362,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1891/500000]
+ train/ActionNoiseL2Loss=0.1978
+ throughput/total_tokens=363,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1892/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=363,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1893/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=363,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1894/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=363,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1895/500000]
+ train/ActionNoiseL2Loss=0.1131
+ throughput/total_tokens=363,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1896/500000]
+ train/ActionNoiseL2Loss=0.1875
+ throughput/total_tokens=364,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1897/500000]
+ train/ActionNoiseL2Loss=0.1355
+ throughput/total_tokens=364,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1898/500000]
+ train/ActionNoiseL2Loss=0.1357
+ throughput/total_tokens=364,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1899/500000]
+ train/ActionNoiseL2Loss=0.1968
+ throughput/total_tokens=364,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=1900/500000]
+ optim/total_grad_norm=1.617
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=364,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1901/500000]
+ train/ActionNoiseL2Loss=0.2366
+ throughput/total_tokens=364,992,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1902/500000]
+ train/ActionNoiseL2Loss=0.1133
+ throughput/total_tokens=365,184,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1903/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=365,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1904/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=365,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1905/500000]
+ train/ActionNoiseL2Loss=0.1696
+ throughput/total_tokens=365,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1906/500000]
+ train/ActionNoiseL2Loss=0.1482
+ throughput/total_tokens=365,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1907/500000]
+ train/ActionNoiseL2Loss=0.1239
+ throughput/total_tokens=366,144,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1908/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=366,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1909/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=366,528,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1910/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=366,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+[step=1911/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=366,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1912/500000]
+ train/ActionNoiseL2Loss=0.1590
+ throughput/total_tokens=367,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1913/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=367,296,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=1914/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=367,488,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1915/500000]
+ train/ActionNoiseL2Loss=0.1430
+ throughput/total_tokens=367,680,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1916/500000]
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=367,872,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1917/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=368,064,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1918/500000]
+ train/ActionNoiseL2Loss=0.1318
+ throughput/total_tokens=368,256,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1919/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=368,448,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=1920/500000]
+ optim/total_grad_norm=2.538
+ train/ActionNoiseL2Loss=0.1361
+ throughput/total_tokens=368,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1921/500000]
+ train/ActionNoiseL2Loss=0.1291
+ throughput/total_tokens=368,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1922/500000]
+ train/ActionNoiseL2Loss=0.1301
+ throughput/total_tokens=369,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1923/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=369,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1924/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=369,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1925/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=369,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1926/500000]
+ train/ActionNoiseL2Loss=0.1603
+ throughput/total_tokens=369,792,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1927/500000]
+ train/ActionNoiseL2Loss=0.1582
+ throughput/total_tokens=369,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1928/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=370,176,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1929/500000]
+ train/ActionNoiseL2Loss=0.1506
+ throughput/total_tokens=370,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1930/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=370,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1931/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=370,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1932/500000]
+ train/ActionNoiseL2Loss=0.1529
+ throughput/total_tokens=370,944,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1933/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=371,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1934/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=371,328,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1935/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=371,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1936/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=371,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1937/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=371,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1938/500000]
+ train/ActionNoiseL2Loss=0.1559
+ throughput/total_tokens=372,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1939/500000]
+ train/ActionNoiseL2Loss=0.1275
+ throughput/total_tokens=372,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1940/500000]
+ optim/total_grad_norm=1.969
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=372,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1941/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=372,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1942/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=372,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1943/500000]
+ train/ActionNoiseL2Loss=0.1162
+ throughput/total_tokens=373,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1944/500000]
+ train/ActionNoiseL2Loss=0.1278
+ throughput/total_tokens=373,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1945/500000]
+ train/ActionNoiseL2Loss=0.1329
+ throughput/total_tokens=373,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1946/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=373,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1947/500000]
+ train/ActionNoiseL2Loss=0.1450
+ throughput/total_tokens=373,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1948/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=374,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1949/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=374,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1950/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=374,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1951/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=374,592,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1952/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=374,784,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1953/500000]
+ train/ActionNoiseL2Loss=0.1270
+ throughput/total_tokens=374,976,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1954/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=375,168,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1955/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=375,360,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1956/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=375,552,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1957/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=375,744,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1958/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=375,936,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1959/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=376,128,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1960/500000]
+ optim/total_grad_norm=2.404
+ train/ActionNoiseL2Loss=0.1399
+ throughput/total_tokens=376,320,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+ System/Peak GPU Memory (MB)=51,073
+[step=1961/500000]
+ train/ActionNoiseL2Loss=0.1133
+ throughput/total_tokens=376,512,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1962/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=376,704,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1963/500000]
+ train/ActionNoiseL2Loss=0.1244
+ throughput/total_tokens=376,896,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1964/500000]
+ train/ActionNoiseL2Loss=0.1180
+ throughput/total_tokens=377,088,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1965/500000]
+ train/ActionNoiseL2Loss=0.1193
+ throughput/total_tokens=377,280,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1966/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=377,472,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1967/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=377,664,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1968/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=377,856,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1969/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=378,048,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=1970/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=378,240,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1971/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=378,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1972/500000]
+ train/ActionNoiseL2Loss=0.1908
+ throughput/total_tokens=378,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1973/500000]
+ train/ActionNoiseL2Loss=0.1084
+ throughput/total_tokens=378,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1974/500000]
+ train/ActionNoiseL2Loss=0.2044
+ throughput/total_tokens=379,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1975/500000]
+ train/ActionNoiseL2Loss=0.1430
+ throughput/total_tokens=379,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1976/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=379,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1977/500000]
+ train/ActionNoiseL2Loss=0.1348
+ throughput/total_tokens=379,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1978/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=379,776,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1979/500000]
+ train/ActionNoiseL2Loss=0.1209
+ throughput/total_tokens=379,968,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1980/500000]
+ optim/total_grad_norm=2.167
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=380,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1981/500000]
+ train/ActionNoiseL2Loss=0.1673
+ throughput/total_tokens=380,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1982/500000]
+ train/ActionNoiseL2Loss=0.1444
+ throughput/total_tokens=380,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1983/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=380,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1984/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=380,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1985/500000]
+ train/ActionNoiseL2Loss=0.1329
+ throughput/total_tokens=381,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1986/500000]
+ train/ActionNoiseL2Loss=0.1687
+ throughput/total_tokens=381,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=1987/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=381,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1988/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=381,696,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1989/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=381,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=1990/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=382,080,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,073
+[step=1991/500000]
+ train/ActionNoiseL2Loss=0.1234
+ throughput/total_tokens=382,272,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1992/500000]
+ train/ActionNoiseL2Loss=0.1253
+ throughput/total_tokens=382,464,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1993/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=382,656,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1994/500000]
+ train/ActionNoiseL2Loss=0.1155
+ throughput/total_tokens=382,848,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1995/500000]
+ train/ActionNoiseL2Loss=0.1560
+ throughput/total_tokens=383,040,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1996/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=383,232,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1997/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=383,424,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1998/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=383,616,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=1999/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=383,808,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2000/500000]
+ optim/total_grad_norm=1.500
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=384,000,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,073
+10/12 [04:32:21] INFO | >> Saving config... checkpoint.py:608
+10/12 [04:32:54] INFO | >> Saving model state... checkpoint.py:796
+10/12 [04:34:02] INFO | >> Saving optim state... checkpoint.py:811
+10/12 [04:35:36] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=2001/500000]
+ train/ActionNoiseL2Loss=0.1018
+ throughput/total_tokens=384,192,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0473
+[step=2002/500000]
+ train/ActionNoiseL2Loss=0.1648
+ throughput/total_tokens=384,384,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=2003/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=384,576,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=2004/500000]
+ train/ActionNoiseL2Loss=0.1162
+ throughput/total_tokens=384,768,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2005/500000]
+ train/ActionNoiseL2Loss=0.1489
+ throughput/total_tokens=384,960,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2006/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=385,152,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2007/500000]
+ train/ActionNoiseL2Loss=0.1293
+ throughput/total_tokens=385,344,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2008/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=385,536,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2009/500000]
+ train/ActionNoiseL2Loss=0.1137
+ throughput/total_tokens=385,728,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2010/500000]
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=385,920,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2011/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=386,112,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2012/500000]
+ train/ActionNoiseL2Loss=0.1767
+ throughput/total_tokens=386,304,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2013/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=386,496,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2014/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=386,688,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2015/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=386,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2016/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=387,072,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2017/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=387,264,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2018/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=387,456,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2019/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=387,648,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2020/500000]
+ optim/total_grad_norm=1.880
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=387,840,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=2021/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=388,032,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2022/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=388,224,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2023/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=388,416,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2024/500000]
+ train/ActionNoiseL2Loss=0.1334
+ throughput/total_tokens=388,608,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2025/500000]
+ train/ActionNoiseL2Loss=0.1327
+ throughput/total_tokens=388,800,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2026/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=388,992,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2027/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=389,184,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2028/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=389,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2029/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=389,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2030/500000]
+ train/ActionNoiseL2Loss=0.1319
+ throughput/total_tokens=389,760,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2031/500000]
+ train/ActionNoiseL2Loss=0.1376
+ throughput/total_tokens=389,952,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2032/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=390,144,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2033/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=390,336,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2034/500000]
+ train/ActionNoiseL2Loss=0.1676
+ throughput/total_tokens=390,528,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2035/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=390,720,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2036/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=390,912,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2037/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=391,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2038/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=391,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2039/500000]
+ train/ActionNoiseL2Loss=0.1779
+ throughput/total_tokens=391,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2040/500000]
+ optim/total_grad_norm=2.682
+ train/ActionNoiseL2Loss=0.1643
+ throughput/total_tokens=391,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2041/500000]
+ train/ActionNoiseL2Loss=0.1608
+ throughput/total_tokens=391,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2042/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=392,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2043/500000]
+ train/ActionNoiseL2Loss=0.1167
+ throughput/total_tokens=392,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2044/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=392,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2045/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=392,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2046/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=392,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2047/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=393,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2048/500000]
+ train/ActionNoiseL2Loss=0.1675
+ throughput/total_tokens=393,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2049/500000]
+ train/ActionNoiseL2Loss=0.1304
+ throughput/total_tokens=393,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2050/500000]
+ train/ActionNoiseL2Loss=0.1405
+ throughput/total_tokens=393,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2051/500000]
+ train/ActionNoiseL2Loss=0.1369
+ throughput/total_tokens=393,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2052/500000]
+ train/ActionNoiseL2Loss=0.0998
+ throughput/total_tokens=393,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2053/500000]
+ train/ActionNoiseL2Loss=0.1467
+ throughput/total_tokens=394,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2054/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=394,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2055/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=394,560,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2056/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=394,752,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2057/500000]
+ train/ActionNoiseL2Loss=0.1663
+ throughput/total_tokens=394,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2058/500000]
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=395,136,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2059/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=395,328,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2060/500000]
+ optim/total_grad_norm=1.556
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=395,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2061/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=395,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2062/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=395,904,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2063/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=396,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2064/500000]
+ train/ActionNoiseL2Loss=0.1216
+ throughput/total_tokens=396,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2065/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=396,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2066/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=396,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2067/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=396,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2068/500000]
+ train/ActionNoiseL2Loss=0.1262
+ throughput/total_tokens=397,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2069/500000]
+ train/ActionNoiseL2Loss=0.1149
+ throughput/total_tokens=397,248,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2070/500000]
+ train/ActionNoiseL2Loss=0.1117
+ throughput/total_tokens=397,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2071/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=397,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2072/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=397,824,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2073/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=398,016,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2074/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=398,208,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2075/500000]
+ train/ActionNoiseL2Loss=0.1381
+ throughput/total_tokens=398,400,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2076/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=398,592,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2077/500000]
+ train/ActionNoiseL2Loss=0.1349
+ throughput/total_tokens=398,784,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2078/500000]
+ train/ActionNoiseL2Loss=0.1104
+ throughput/total_tokens=398,976,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2079/500000]
+ train/ActionNoiseL2Loss=0.1379
+ throughput/total_tokens=399,168,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2080/500000]
+ optim/total_grad_norm=1.812
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=399,360,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2081/500000]
+ train/ActionNoiseL2Loss=0.1148
+ throughput/total_tokens=399,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2082/500000]
+ train/ActionNoiseL2Loss=0.1544
+ throughput/total_tokens=399,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2083/500000]
+ train/ActionNoiseL2Loss=0.1220
+ throughput/total_tokens=399,936,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2084/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=400,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2085/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=400,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2086/500000]
+ train/ActionNoiseL2Loss=0.1320
+ throughput/total_tokens=400,512,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2087/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=400,704,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2088/500000]
+ train/ActionNoiseL2Loss=0.1080
+ throughput/total_tokens=400,896,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2089/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=401,088,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2090/500000]
+ train/ActionNoiseL2Loss=0.0967
+ throughput/total_tokens=401,280,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2091/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=401,472,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2092/500000]
+ train/ActionNoiseL2Loss=0.1262
+ throughput/total_tokens=401,664,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2093/500000]
+ train/ActionNoiseL2Loss=0.1542
+ throughput/total_tokens=401,856,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2094/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=402,048,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2095/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=402,240,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2096/500000]
+ train/ActionNoiseL2Loss=0.1229
+ throughput/total_tokens=402,432,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2097/500000]
+ train/ActionNoiseL2Loss=0.1180
+ throughput/total_tokens=402,624,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2098/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=402,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2099/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=403,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2100/500000]
+ optim/total_grad_norm=1.479
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=403,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2101/500000]
+ train/ActionNoiseL2Loss=0.1635
+ throughput/total_tokens=403,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2102/500000]
+ train/ActionNoiseL2Loss=0.1099
+ throughput/total_tokens=403,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2103/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=403,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2104/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=403,968,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2105/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=404,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2106/500000]
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=404,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2107/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=404,544,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2108/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=404,736,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2109/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=404,928,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2110/500000]
+ train/ActionNoiseL2Loss=0.1378
+ throughput/total_tokens=405,120,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=2111/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=405,312,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2112/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=405,504,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2113/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=405,696,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2114/500000]
+ train/ActionNoiseL2Loss=0.1175
+ throughput/total_tokens=405,888,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2115/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=406,080,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2116/500000]
+ train/ActionNoiseL2Loss=0.1281
+ throughput/total_tokens=406,272,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2117/500000]
+ train/ActionNoiseL2Loss=0.1235
+ throughput/total_tokens=406,464,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2118/500000]
+ train/ActionNoiseL2Loss=0.1316
+ throughput/total_tokens=406,656,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2119/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=406,848,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2120/500000]
+ optim/total_grad_norm=0.9637
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=407,040,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2121/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=407,232,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2122/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=407,424,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2123/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=407,616,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2124/500000]
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=407,808,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2125/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=408,000,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2126/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=408,192,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2127/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=408,384,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2128/500000]
+ train/ActionNoiseL2Loss=0.1252
+ throughput/total_tokens=408,576,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2129/500000]
+ train/ActionNoiseL2Loss=0.1523
+ throughput/total_tokens=408,768,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2130/500000]
+ train/ActionNoiseL2Loss=0.1180
+ throughput/total_tokens=408,960,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2131/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=409,152,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2132/500000]
+ train/ActionNoiseL2Loss=0.1189
+ throughput/total_tokens=409,344,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2133/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=409,536,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2134/500000]
+ train/ActionNoiseL2Loss=0.1571
+ throughput/total_tokens=409,728,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2135/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=409,920,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2136/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=410,112,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2137/500000]
+ train/ActionNoiseL2Loss=0.1318
+ throughput/total_tokens=410,304,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2138/500000]
+ train/ActionNoiseL2Loss=0.1102
+ throughput/total_tokens=410,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2139/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=410,688,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2140/500000]
+ optim/total_grad_norm=2.286
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=410,880,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2141/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=411,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2142/500000]
+ train/ActionNoiseL2Loss=0.1275
+ throughput/total_tokens=411,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2143/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=411,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2144/500000]
+ train/ActionNoiseL2Loss=0.1430
+ throughput/total_tokens=411,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2145/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=411,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2146/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=412,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2147/500000]
+ train/ActionNoiseL2Loss=0.1173
+ throughput/total_tokens=412,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2148/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=412,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2149/500000]
+ train/ActionNoiseL2Loss=0.1270
+ throughput/total_tokens=412,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2150/500000]
+ train/ActionNoiseL2Loss=0.2024
+ throughput/total_tokens=412,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2151/500000]
+ train/ActionNoiseL2Loss=0.1481
+ throughput/total_tokens=412,992,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2152/500000]
+ train/ActionNoiseL2Loss=0.1392
+ throughput/total_tokens=413,184,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2153/500000]
+ train/ActionNoiseL2Loss=0.1304
+ throughput/total_tokens=413,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2154/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=413,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2155/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=413,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2156/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=413,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2157/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=414,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2158/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=414,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2159/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=414,528,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2160/500000]
+ optim/total_grad_norm=1.572
+ train/ActionNoiseL2Loss=0.1223
+ throughput/total_tokens=414,720,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2161/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=414,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2162/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=415,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2163/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=415,296,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2164/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=415,488,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2165/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=415,680,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2166/500000]
+ train/ActionNoiseL2Loss=0.0956
+ throughput/total_tokens=415,872,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2167/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=416,064,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2168/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=416,256,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2169/500000]
+ train/ActionNoiseL2Loss=0.1266
+ throughput/total_tokens=416,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2170/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=416,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2171/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=416,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2172/500000]
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=417,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2173/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=417,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2174/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=417,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2175/500000]
+ train/ActionNoiseL2Loss=0.1349
+ throughput/total_tokens=417,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2176/500000]
+ train/ActionNoiseL2Loss=0.1151
+ throughput/total_tokens=417,792,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2177/500000]
+ train/ActionNoiseL2Loss=0.1797
+ throughput/total_tokens=417,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2178/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=418,176,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2179/500000]
+ train/ActionNoiseL2Loss=0.1873
+ throughput/total_tokens=418,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2180/500000]
+ optim/total_grad_norm=1.903
+ train/ActionNoiseL2Loss=0.1161
+ throughput/total_tokens=418,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2181/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=418,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2182/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=418,944,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2183/500000]
+ train/ActionNoiseL2Loss=0.1280
+ throughput/total_tokens=419,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2184/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=419,328,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2185/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=419,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2186/500000]
+ train/ActionNoiseL2Loss=0.1147
+ throughput/total_tokens=419,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2187/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=419,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2188/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=420,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2189/500000]
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=420,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2190/500000]
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=420,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2191/500000]
+ train/ActionNoiseL2Loss=0.1195
+ throughput/total_tokens=420,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2192/500000]
+ train/ActionNoiseL2Loss=0.1456
+ throughput/total_tokens=420,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2193/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=421,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2194/500000]
+ train/ActionNoiseL2Loss=0.1611
+ throughput/total_tokens=421,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2195/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=421,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2196/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=421,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2197/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=421,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2198/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=422,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2199/500000]
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=422,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2200/500000]
+ optim/total_grad_norm=2.178
+ train/ActionNoiseL2Loss=0.1180
+ throughput/total_tokens=422,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2201/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=422,592,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2202/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=422,784,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2203/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=422,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2204/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=423,168,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2205/500000]
+ train/ActionNoiseL2Loss=0.1826
+ throughput/total_tokens=423,360,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2206/500000]
+ train/ActionNoiseL2Loss=0.1305
+ throughput/total_tokens=423,552,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2207/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=423,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2208/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=423,936,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2209/500000]
+ train/ActionNoiseL2Loss=0.1591
+ throughput/total_tokens=424,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2210/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=424,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2211/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=424,512,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2212/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=424,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2213/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=424,896,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2214/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=425,088,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2215/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=425,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2216/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=425,472,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2217/500000]
+ train/ActionNoiseL2Loss=0.1329
+ throughput/total_tokens=425,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2218/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=425,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2219/500000]
+ train/ActionNoiseL2Loss=0.1269
+ throughput/total_tokens=426,048,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2220/500000]
+ optim/total_grad_norm=1.756
+ train/ActionNoiseL2Loss=0.1088
+ throughput/total_tokens=426,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2221/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=426,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2222/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=426,624,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2223/500000]
+ train/ActionNoiseL2Loss=0.1652
+ throughput/total_tokens=426,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2224/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=427,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2225/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=427,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2226/500000]
+ train/ActionNoiseL2Loss=0.1718
+ throughput/total_tokens=427,392,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2227/500000]
+ train/ActionNoiseL2Loss=0.1347
+ throughput/total_tokens=427,584,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2228/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=427,776,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2229/500000]
+ train/ActionNoiseL2Loss=0.1136
+ throughput/total_tokens=427,968,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2230/500000]
+ train/ActionNoiseL2Loss=0.1117
+ throughput/total_tokens=428,160,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2231/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=428,352,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2232/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=428,544,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2233/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=428,736,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2234/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=428,928,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2235/500000]
+ train/ActionNoiseL2Loss=0.1690
+ throughput/total_tokens=429,120,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2236/500000]
+ train/ActionNoiseL2Loss=0.1105
+ throughput/total_tokens=429,312,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2237/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=429,504,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2238/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=429,696,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2239/500000]
+ train/ActionNoiseL2Loss=0.1299
+ throughput/total_tokens=429,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2240/500000]
+ optim/total_grad_norm=2.026
+ train/ActionNoiseL2Loss=0.1420
+ throughput/total_tokens=430,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2241/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=430,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2242/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=430,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2243/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=430,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2244/500000]
+ train/ActionNoiseL2Loss=0.1186
+ throughput/total_tokens=430,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2245/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=431,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2246/500000]
+ train/ActionNoiseL2Loss=0.1162
+ throughput/total_tokens=431,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2247/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=431,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2248/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=431,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2249/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=431,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2250/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=432,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2251/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=432,192,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2252/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=432,384,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2253/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=432,576,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2254/500000]
+ train/ActionNoiseL2Loss=0.1104
+ throughput/total_tokens=432,768,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2255/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=432,960,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2256/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=433,152,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2257/500000]
+ train/ActionNoiseL2Loss=0.1421
+ throughput/total_tokens=433,344,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2258/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=433,536,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2259/500000]
+ train/ActionNoiseL2Loss=0.1452
+ throughput/total_tokens=433,728,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2260/500000]
+ optim/total_grad_norm=1.254
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=433,920,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2261/500000]
+ train/ActionNoiseL2Loss=0.1509
+ throughput/total_tokens=434,112,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2262/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=434,304,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2263/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=434,496,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2264/500000]
+ train/ActionNoiseL2Loss=0.1775
+ throughput/total_tokens=434,688,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2265/500000]
+ train/ActionNoiseL2Loss=0.1616
+ throughput/total_tokens=434,880,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2266/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=435,072,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2267/500000]
+ train/ActionNoiseL2Loss=0.1115
+ throughput/total_tokens=435,264,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2268/500000]
+ train/ActionNoiseL2Loss=0.1215
+ throughput/total_tokens=435,456,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2269/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=435,648,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2270/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=435,840,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=2271/500000]
+ train/ActionNoiseL2Loss=0.1243
+ throughput/total_tokens=436,032,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2272/500000]
+ train/ActionNoiseL2Loss=0.1125
+ throughput/total_tokens=436,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=2273/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=436,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2274/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=436,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2275/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=436,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2276/500000]
+ train/ActionNoiseL2Loss=0.1341
+ throughput/total_tokens=436,992,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2277/500000]
+ train/ActionNoiseL2Loss=0.1267
+ throughput/total_tokens=437,184,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2278/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=437,376,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2279/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=437,568,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2280/500000]
+ optim/total_grad_norm=1.671
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=437,760,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2281/500000]
+ train/ActionNoiseL2Loss=0.1472
+ throughput/total_tokens=437,952,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2282/500000]
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=438,144,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2283/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=438,336,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2284/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=438,528,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2285/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=438,720,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2286/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=438,912,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2287/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=439,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2288/500000]
+ train/ActionNoiseL2Loss=0.1500
+ throughput/total_tokens=439,296,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2289/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=439,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2290/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=439,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2291/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=439,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2292/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=440,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2293/500000]
+ train/ActionNoiseL2Loss=0.1137
+ throughput/total_tokens=440,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2294/500000]
+ train/ActionNoiseL2Loss=0.1543
+ throughput/total_tokens=440,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2295/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=440,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2296/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=440,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2297/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=441,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2298/500000]
+ train/ActionNoiseL2Loss=0.1636
+ throughput/total_tokens=441,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2299/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=441,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2300/500000]
+ optim/total_grad_norm=2.171
+ train/ActionNoiseL2Loss=0.1205
+ throughput/total_tokens=441,600,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2301/500000]
+ train/ActionNoiseL2Loss=0.1452
+ throughput/total_tokens=441,792,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2302/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=441,984,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2303/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=442,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2304/500000]
+ train/ActionNoiseL2Loss=0.1962
+ throughput/total_tokens=442,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2305/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=442,560,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2306/500000]
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=442,752,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2307/500000]
+ train/ActionNoiseL2Loss=0.1114
+ throughput/total_tokens=442,944,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2308/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=443,136,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2309/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=443,328,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2310/500000]
+ train/ActionNoiseL2Loss=0.1342
+ throughput/total_tokens=443,520,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=2311/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=443,712,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2312/500000]
+ train/ActionNoiseL2Loss=0.1161
+ throughput/total_tokens=443,904,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2313/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=444,096,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2314/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=444,288,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2315/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=444,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2316/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=444,672,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2317/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=444,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2318/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=445,056,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2319/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=445,248,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2320/500000]
+ optim/total_grad_norm=1.396
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=445,440,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2321/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=445,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2322/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=445,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2323/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=446,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2324/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=446,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2325/500000]
+ train/ActionNoiseL2Loss=0.1673
+ throughput/total_tokens=446,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2326/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=446,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2327/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=446,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2328/500000]
+ train/ActionNoiseL2Loss=0.1384
+ throughput/total_tokens=446,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2329/500000]
+ train/ActionNoiseL2Loss=0.1012
+ throughput/total_tokens=447,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2330/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=447,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2331/500000]
+ train/ActionNoiseL2Loss=0.1376
+ throughput/total_tokens=447,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2332/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=447,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2333/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=447,936,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2334/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=448,128,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2335/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=448,320,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2336/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=448,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2337/500000]
+ train/ActionNoiseL2Loss=0.1245
+ throughput/total_tokens=448,704,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2338/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=448,896,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2339/500000]
+ train/ActionNoiseL2Loss=0.1489
+ throughput/total_tokens=449,088,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2340/500000]
+ optim/total_grad_norm=1.676
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=449,280,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2341/500000]
+ train/ActionNoiseL2Loss=0.1125
+ throughput/total_tokens=449,472,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2342/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=449,664,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2343/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=449,856,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2344/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=450,048,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2345/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=450,240,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2346/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=450,432,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2347/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=450,624,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2348/500000]
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=450,816,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2349/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=451,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2350/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=451,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2351/500000]
+ train/ActionNoiseL2Loss=0.1436
+ throughput/total_tokens=451,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2352/500000]
+ train/ActionNoiseL2Loss=0.1311
+ throughput/total_tokens=451,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2353/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=451,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2354/500000]
+ train/ActionNoiseL2Loss=0.1879
+ throughput/total_tokens=451,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2355/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=452,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2356/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=452,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2357/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=452,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2358/500000]
+ train/ActionNoiseL2Loss=0.1284
+ throughput/total_tokens=452,736,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2359/500000]
+ train/ActionNoiseL2Loss=0.1153
+ throughput/total_tokens=452,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2360/500000]
+ optim/total_grad_norm=2.983
+ train/ActionNoiseL2Loss=0.1271
+ throughput/total_tokens=453,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2361/500000]
+ train/ActionNoiseL2Loss=0.1356
+ throughput/total_tokens=453,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2362/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=453,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2363/500000]
+ train/ActionNoiseL2Loss=0.1127
+ throughput/total_tokens=453,696,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2364/500000]
+ train/ActionNoiseL2Loss=0.1324
+ throughput/total_tokens=453,888,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2365/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=454,080,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2366/500000]
+ train/ActionNoiseL2Loss=0.1395
+ throughput/total_tokens=454,272,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2367/500000]
+ train/ActionNoiseL2Loss=0.1159
+ throughput/total_tokens=454,464,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2368/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=454,656,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2369/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=454,848,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2370/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=455,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2371/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=455,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2372/500000]
+ train/ActionNoiseL2Loss=0.1493
+ throughput/total_tokens=455,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2373/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=455,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2374/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=455,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2375/500000]
+ train/ActionNoiseL2Loss=0.1761
+ throughput/total_tokens=456,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2376/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=456,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2377/500000]
+ train/ActionNoiseL2Loss=0.1578
+ throughput/total_tokens=456,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2378/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=456,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2379/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=456,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2380/500000]
+ optim/total_grad_norm=1.710
+ train/ActionNoiseL2Loss=0.0956
+ throughput/total_tokens=456,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2381/500000]
+ train/ActionNoiseL2Loss=0.1346
+ throughput/total_tokens=457,152,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2382/500000]
+ train/ActionNoiseL2Loss=0.1084
+ throughput/total_tokens=457,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2383/500000]
+ train/ActionNoiseL2Loss=0.1517
+ throughput/total_tokens=457,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2384/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=457,728,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2385/500000]
+ train/ActionNoiseL2Loss=0.1498
+ throughput/total_tokens=457,920,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2386/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=458,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2387/500000]
+ train/ActionNoiseL2Loss=0.1293
+ throughput/total_tokens=458,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2388/500000]
+ train/ActionNoiseL2Loss=0.0897
+ throughput/total_tokens=458,496,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2389/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=458,688,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2390/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=458,880,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=2391/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=459,072,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2392/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=459,264,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2393/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=459,456,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2394/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=459,648,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2395/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=459,840,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2396/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=460,032,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2397/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=460,224,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2398/500000]
+ train/ActionNoiseL2Loss=0.1322
+ throughput/total_tokens=460,416,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2399/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=460,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2400/500000]
+ optim/total_grad_norm=1.705
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=460,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=2401/500000]
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=460,992,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2402/500000]
+ train/ActionNoiseL2Loss=0.1391
+ throughput/total_tokens=461,184,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2403/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=461,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2404/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=461,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2405/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=461,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2406/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=461,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2407/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=462,144,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2408/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=462,336,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2409/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=462,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2410/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=462,720,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=2411/500000]
+ train/ActionNoiseL2Loss=0.1570
+ throughput/total_tokens=462,912,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2412/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=463,104,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2413/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=463,296,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2414/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=463,488,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2415/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=463,680,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2416/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=463,872,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=2417/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=464,064,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=2418/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=464,256,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=2419/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=464,448,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2420/500000]
+ optim/total_grad_norm=2.394
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=464,640,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2421/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=464,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2422/500000]
+ train/ActionNoiseL2Loss=0.1397
+ throughput/total_tokens=465,024,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2423/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=465,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2424/500000]
+ train/ActionNoiseL2Loss=0.1254
+ throughput/total_tokens=465,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2425/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=465,600,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2426/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=465,792,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2427/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=465,984,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2428/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=466,176,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2429/500000]
+ train/ActionNoiseL2Loss=0.1066
+ throughput/total_tokens=466,368,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2430/500000]
+ train/ActionNoiseL2Loss=0.1914
+ throughput/total_tokens=466,560,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2431/500000]
+ train/ActionNoiseL2Loss=0.1199
+ throughput/total_tokens=466,752,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2432/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=466,944,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2433/500000]
+ train/ActionNoiseL2Loss=0.1368
+ throughput/total_tokens=467,136,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2434/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=467,328,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2435/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=467,520,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2436/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=467,712,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2437/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=467,904,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2438/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=468,096,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2439/500000]
+ train/ActionNoiseL2Loss=0.1148
+ throughput/total_tokens=468,288,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2440/500000]
+ optim/total_grad_norm=1.498
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=468,480,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2441/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=468,672,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2442/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=468,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2443/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=469,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2444/500000]
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=469,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2445/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=469,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2446/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=469,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2447/500000]
+ train/ActionNoiseL2Loss=0.1288
+ throughput/total_tokens=469,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2448/500000]
+ train/ActionNoiseL2Loss=0.1385
+ throughput/total_tokens=470,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2449/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=470,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2450/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=470,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2451/500000]
+ train/ActionNoiseL2Loss=0.1311
+ throughput/total_tokens=470,592,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2452/500000]
+ train/ActionNoiseL2Loss=0.1176
+ throughput/total_tokens=470,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2453/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=470,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2454/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=471,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2455/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=471,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2456/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=471,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2457/500000]
+ train/ActionNoiseL2Loss=0.1041
+ throughput/total_tokens=471,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2458/500000]
+ train/ActionNoiseL2Loss=0.1446
+ throughput/total_tokens=471,936,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2459/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=472,128,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2460/500000]
+ optim/total_grad_norm=1.420
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=472,320,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2461/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=472,512,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2462/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=472,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2463/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=472,896,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2464/500000]
+ train/ActionNoiseL2Loss=0.1600
+ throughput/total_tokens=473,088,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2465/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=473,280,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2466/500000]
+ train/ActionNoiseL2Loss=0.1447
+ throughput/total_tokens=473,472,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2467/500000]
+ train/ActionNoiseL2Loss=0.1301
+ throughput/total_tokens=473,664,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2468/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=473,856,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2469/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=474,048,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2470/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=474,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2471/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=474,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2472/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=474,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2473/500000]
+ train/ActionNoiseL2Loss=0.1321
+ throughput/total_tokens=474,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2474/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=475,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=2475/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=475,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2476/500000]
+ train/ActionNoiseL2Loss=0.1211
+ throughput/total_tokens=475,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2477/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=475,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2478/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=475,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2479/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=475,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2480/500000]
+ optim/total_grad_norm=1.053
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=476,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2481/500000]
+ train/ActionNoiseL2Loss=0.1257
+ throughput/total_tokens=476,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2482/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=476,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2483/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=476,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2484/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=476,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2485/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=477,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2486/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=477,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2487/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=477,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2488/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=477,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=2489/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=477,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2490/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=478,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=2491/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=478,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2492/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=478,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2493/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=478,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=2494/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=478,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2495/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=479,040,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2496/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=479,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2497/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=479,424,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2498/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=479,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2499/500000]
+ train/ActionNoiseL2Loss=0.1201
+ throughput/total_tokens=479,808,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2500/500000]
+ optim/total_grad_norm=1.915
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=480,000,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+10/12 [07:31:01] INFO | >> Saving config... checkpoint.py:608
+10/12 [07:31:34] INFO | >> Saving model state... checkpoint.py:796
+10/12 [07:32:46] INFO | >> Saving optim state... checkpoint.py:811
+10/12 [07:34:18] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=2501/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=480,192,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=2502/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=480,384,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=2503/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=480,576,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=2504/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=480,768,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=2505/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=480,960,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=2506/500000]
+ train/ActionNoiseL2Loss=0.1340
+ throughput/total_tokens=481,152,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=2507/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=481,344,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=2508/500000]
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=481,536,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=2509/500000]
+ train/ActionNoiseL2Loss=0.1179
+ throughput/total_tokens=481,728,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=2510/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=481,920,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+ System/Peak GPU Memory (MB)=51,074
+[step=2511/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=482,112,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=2512/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=482,304,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=2513/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=482,496,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=2514/500000]
+ train/ActionNoiseL2Loss=0.1179
+ throughput/total_tokens=482,688,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=2515/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=482,880,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2516/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=483,072,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2517/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=483,264,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2518/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=483,456,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2519/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=483,648,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2520/500000]
+ optim/total_grad_norm=1.745
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=483,840,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=2521/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=484,032,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2522/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=484,224,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2523/500000]
+ train/ActionNoiseL2Loss=0.1476
+ throughput/total_tokens=484,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2524/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=484,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2525/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=484,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2526/500000]
+ train/ActionNoiseL2Loss=0.1185
+ throughput/total_tokens=484,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2527/500000]
+ train/ActionNoiseL2Loss=0.1208
+ throughput/total_tokens=485,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2528/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=485,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2529/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=485,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2530/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=485,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2531/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=485,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2532/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=486,144,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2533/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=486,336,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2534/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=486,528,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2535/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=486,720,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2536/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=486,912,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2537/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=487,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2538/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=487,296,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2539/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=487,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2540/500000]
+ optim/total_grad_norm=2.253
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=487,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2541/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=487,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2542/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=488,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2543/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=488,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2544/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=488,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2545/500000]
+ train/ActionNoiseL2Loss=0.1190
+ throughput/total_tokens=488,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2546/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=488,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2547/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=489,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2548/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=489,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2549/500000]
+ train/ActionNoiseL2Loss=0.1174
+ throughput/total_tokens=489,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2550/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=489,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2551/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=489,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2552/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=489,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2553/500000]
+ train/ActionNoiseL2Loss=0.1362
+ throughput/total_tokens=490,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2554/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=490,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2555/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=490,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2556/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=490,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2557/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=490,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2558/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=491,136,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2559/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=491,328,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2560/500000]
+ optim/total_grad_norm=1.156
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=491,520,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2561/500000]
+ train/ActionNoiseL2Loss=0.1120
+ throughput/total_tokens=491,712,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2562/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=491,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2563/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=492,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2564/500000]
+ train/ActionNoiseL2Loss=0.1538
+ throughput/total_tokens=492,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2565/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=492,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2566/500000]
+ train/ActionNoiseL2Loss=0.1865
+ throughput/total_tokens=492,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2567/500000]
+ train/ActionNoiseL2Loss=0.1274
+ throughput/total_tokens=492,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2568/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=493,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2569/500000]
+ train/ActionNoiseL2Loss=0.1084
+ throughput/total_tokens=493,248,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2570/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=493,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2571/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=493,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2572/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=493,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2573/500000]
+ train/ActionNoiseL2Loss=0.1501
+ throughput/total_tokens=494,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2574/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=494,208,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2575/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=494,400,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2576/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=494,592,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2577/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=494,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2578/500000]
+ train/ActionNoiseL2Loss=0.1146
+ throughput/total_tokens=494,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2579/500000]
+ train/ActionNoiseL2Loss=0.1160
+ throughput/total_tokens=495,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2580/500000]
+ optim/total_grad_norm=1.146
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=495,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2581/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=495,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2582/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=495,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2583/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=495,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2584/500000]
+ train/ActionNoiseL2Loss=0.1221
+ throughput/total_tokens=496,128,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2585/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=496,320,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2586/500000]
+ train/ActionNoiseL2Loss=0.1260
+ throughput/total_tokens=496,512,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2587/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=496,704,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2588/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=496,896,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2589/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=497,088,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2590/500000]
+ train/ActionNoiseL2Loss=0.1191
+ throughput/total_tokens=497,280,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2591/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=497,472,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2592/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=497,664,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2593/500000]
+ train/ActionNoiseL2Loss=0.1288
+ throughput/total_tokens=497,856,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2594/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=498,048,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2595/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=498,240,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2596/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=498,432,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2597/500000]
+ train/ActionNoiseL2Loss=0.1142
+ throughput/total_tokens=498,624,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2598/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=498,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2599/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=499,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2600/500000]
+ optim/total_grad_norm=2.389
+ train/ActionNoiseL2Loss=0.1056
+ throughput/total_tokens=499,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2601/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=499,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2602/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=499,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2603/500000]
+ train/ActionNoiseL2Loss=0.1650
+ throughput/total_tokens=499,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2604/500000]
+ train/ActionNoiseL2Loss=0.1174
+ throughput/total_tokens=499,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2605/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=500,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2606/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=500,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2607/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=500,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2608/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=500,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2609/500000]
+ train/ActionNoiseL2Loss=0.1480
+ throughput/total_tokens=500,928,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2610/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=501,120,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2611/500000]
+ train/ActionNoiseL2Loss=0.1266
+ throughput/total_tokens=501,312,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2612/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=501,504,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2613/500000]
+ train/ActionNoiseL2Loss=0.1694
+ throughput/total_tokens=501,696,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2614/500000]
+ train/ActionNoiseL2Loss=0.1759
+ throughput/total_tokens=501,888,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2615/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=502,080,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2616/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=502,272,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2617/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=502,464,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2618/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=502,656,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2619/500000]
+ train/ActionNoiseL2Loss=0.1122
+ throughput/total_tokens=502,848,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2620/500000]
+ optim/total_grad_norm=1.461
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=503,040,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=2621/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=503,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2622/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=503,424,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2623/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=503,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2624/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=503,808,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2625/500000]
+ train/ActionNoiseL2Loss=0.1223
+ throughput/total_tokens=504,000,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2626/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=504,192,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2627/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=504,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2628/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=504,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2629/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=504,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2630/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=504,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=2631/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=505,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2632/500000]
+ train/ActionNoiseL2Loss=0.1245
+ throughput/total_tokens=505,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2633/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=505,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2634/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=505,728,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2635/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=505,920,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2636/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=506,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2637/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=506,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2638/500000]
+ train/ActionNoiseL2Loss=0.1194
+ throughput/total_tokens=506,496,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2639/500000]
+ train/ActionNoiseL2Loss=0.1585
+ throughput/total_tokens=506,688,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2640/500000]
+ optim/total_grad_norm=1.816
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=506,880,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=2641/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=507,072,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2642/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=507,264,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2643/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=507,456,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2644/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=507,648,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=2645/500000]
+ train/ActionNoiseL2Loss=0.1147
+ throughput/total_tokens=507,840,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=2646/500000]
+ train/ActionNoiseL2Loss=0.0976
+ throughput/total_tokens=508,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2647/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=508,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=2648/500000]
+ train/ActionNoiseL2Loss=0.0998
+ throughput/total_tokens=508,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2649/500000]
+ train/ActionNoiseL2Loss=0.1105
+ throughput/total_tokens=508,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2650/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=508,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=2651/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=508,992,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2652/500000]
+ train/ActionNoiseL2Loss=0.1357
+ throughput/total_tokens=509,184,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2653/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=509,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2654/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=509,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2655/500000]
+ train/ActionNoiseL2Loss=0.1203
+ throughput/total_tokens=509,760,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2656/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=509,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2657/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=510,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2658/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=510,336,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2659/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=510,528,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2660/500000]
+ optim/total_grad_norm=0.8850
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=510,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2661/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=510,912,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2662/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=511,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2663/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=511,296,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2664/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=511,488,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2665/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=511,680,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2666/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=511,872,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2667/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=512,064,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2668/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=512,256,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2669/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=512,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2670/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=512,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2671/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=512,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2672/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=513,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2673/500000]
+ train/ActionNoiseL2Loss=0.1560
+ throughput/total_tokens=513,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2674/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=513,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2675/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=513,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2676/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=513,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2677/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=513,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2678/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=514,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2679/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=514,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2680/500000]
+ optim/total_grad_norm=1.762
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=514,560,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2681/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=514,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2682/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=514,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2683/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=515,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2684/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=515,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2685/500000]
+ train/ActionNoiseL2Loss=0.1410
+ throughput/total_tokens=515,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2686/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=515,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2687/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=515,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2688/500000]
+ train/ActionNoiseL2Loss=0.1167
+ throughput/total_tokens=516,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2689/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=516,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2690/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=516,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2691/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=516,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2692/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=516,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2693/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=517,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2694/500000]
+ train/ActionNoiseL2Loss=0.1122
+ throughput/total_tokens=517,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2695/500000]
+ train/ActionNoiseL2Loss=0.1098
+ throughput/total_tokens=517,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2696/500000]
+ train/ActionNoiseL2Loss=0.1498
+ throughput/total_tokens=517,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2697/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=517,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2698/500000]
+ train/ActionNoiseL2Loss=0.1366
+ throughput/total_tokens=518,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2699/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=518,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2700/500000]
+ optim/total_grad_norm=1.640
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=518,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2701/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=518,592,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2702/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=518,784,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2703/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=518,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2704/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=519,168,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2705/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=519,360,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2706/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=519,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2707/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=519,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2708/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=519,936,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2709/500000]
+ train/ActionNoiseL2Loss=0.1041
+ throughput/total_tokens=520,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2710/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=520,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2711/500000]
+ train/ActionNoiseL2Loss=0.1216
+ throughput/total_tokens=520,512,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2712/500000]
+ train/ActionNoiseL2Loss=0.1658
+ throughput/total_tokens=520,704,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2713/500000]
+ train/ActionNoiseL2Loss=0.1526
+ throughput/total_tokens=520,896,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2714/500000]
+ train/ActionNoiseL2Loss=0.1538
+ throughput/total_tokens=521,088,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2715/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=521,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2716/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=521,472,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2717/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=521,664,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2718/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=521,856,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2719/500000]
+ train/ActionNoiseL2Loss=0.1084
+ throughput/total_tokens=522,048,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2720/500000]
+ optim/total_grad_norm=1.604
+ train/ActionNoiseL2Loss=0.1508
+ throughput/total_tokens=522,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=2721/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=522,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2722/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=522,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2723/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=522,816,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2724/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=523,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=2725/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=523,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2726/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=523,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=2727/500000]
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=523,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2728/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=523,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2729/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=523,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2730/500000]
+ train/ActionNoiseL2Loss=0.1508
+ throughput/total_tokens=524,160,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2731/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=524,352,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2732/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=524,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2733/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=524,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2734/500000]
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=524,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2735/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=525,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2736/500000]
+ train/ActionNoiseL2Loss=0.1120
+ throughput/total_tokens=525,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2737/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=525,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2738/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=525,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2739/500000]
+ train/ActionNoiseL2Loss=0.1230
+ throughput/total_tokens=525,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2740/500000]
+ optim/total_grad_norm=1.450
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=526,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2741/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=526,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2742/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=526,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2743/500000]
+ train/ActionNoiseL2Loss=0.1211
+ throughput/total_tokens=526,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2744/500000]
+ train/ActionNoiseL2Loss=0.1324
+ throughput/total_tokens=526,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2745/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=527,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2746/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=527,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2747/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=527,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2748/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=527,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2749/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=527,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2750/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=528,000,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2751/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=528,192,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2752/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=528,384,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2753/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=528,576,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2754/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=528,768,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2755/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=528,960,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2756/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=529,152,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2757/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=529,344,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2758/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=529,536,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2759/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=529,728,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2760/500000]
+ optim/total_grad_norm=2.375
+ train/ActionNoiseL2Loss=0.1254
+ throughput/total_tokens=529,920,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=2761/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=530,112,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2762/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=530,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2763/500000]
+ train/ActionNoiseL2Loss=0.1494
+ throughput/total_tokens=530,496,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2764/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=530,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2765/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=530,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2766/500000]
+ train/ActionNoiseL2Loss=0.1303
+ throughput/total_tokens=531,072,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2767/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=531,264,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2768/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=531,456,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2769/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=531,648,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2770/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=531,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2771/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=532,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2772/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=532,224,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2773/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=532,416,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2774/500000]
+ train/ActionNoiseL2Loss=0.1066
+ throughput/total_tokens=532,608,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2775/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=532,800,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2776/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=532,992,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2777/500000]
+ train/ActionNoiseL2Loss=0.1116
+ throughput/total_tokens=533,184,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2778/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=533,376,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2779/500000]
+ train/ActionNoiseL2Loss=0.1315
+ throughput/total_tokens=533,568,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2780/500000]
+ optim/total_grad_norm=1.645
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=533,760,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2781/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=533,952,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2782/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=534,144,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2783/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=534,336,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2784/500000]
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=534,528,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2785/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=534,720,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2786/500000]
+ train/ActionNoiseL2Loss=0.1368
+ throughput/total_tokens=534,912,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2787/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=535,104,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2788/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=535,296,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2789/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=535,488,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2790/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=535,680,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2791/500000]
+ train/ActionNoiseL2Loss=0.1294
+ throughput/total_tokens=535,872,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2792/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=536,064,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2793/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=536,256,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2794/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=536,448,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2795/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=536,640,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2796/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=536,832,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2797/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=537,024,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2798/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=537,216,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2799/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=537,408,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2800/500000]
+ optim/total_grad_norm=1.266
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=537,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2801/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=537,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2802/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=537,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2803/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=538,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2804/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=538,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2805/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=538,560,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2806/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=538,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2807/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=538,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2808/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=539,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2809/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=539,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2810/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=539,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2811/500000]
+ train/ActionNoiseL2Loss=0.1105
+ throughput/total_tokens=539,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2812/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=539,904,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2813/500000]
+ train/ActionNoiseL2Loss=0.1145
+ throughput/total_tokens=540,096,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2814/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=540,288,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2815/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=540,480,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2816/500000]
+ train/ActionNoiseL2Loss=0.1333
+ throughput/total_tokens=540,672,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2817/500000]
+ train/ActionNoiseL2Loss=0.1293
+ throughput/total_tokens=540,864,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2818/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=541,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2819/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=541,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2820/500000]
+ optim/total_grad_norm=1.367
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=541,440,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=2821/500000]
+ train/ActionNoiseL2Loss=0.1414
+ throughput/total_tokens=541,632,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2822/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=541,824,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2823/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=542,016,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2824/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=542,208,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2825/500000]
+ train/ActionNoiseL2Loss=0.1554
+ throughput/total_tokens=542,400,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2826/500000]
+ train/ActionNoiseL2Loss=0.1192
+ throughput/total_tokens=542,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2827/500000]
+ train/ActionNoiseL2Loss=0.1303
+ throughput/total_tokens=542,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2828/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=542,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2829/500000]
+ train/ActionNoiseL2Loss=0.1506
+ throughput/total_tokens=543,168,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2830/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=543,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=2831/500000]
+ train/ActionNoiseL2Loss=0.1329
+ throughput/total_tokens=543,552,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2832/500000]
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=543,744,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2833/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=543,936,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2834/500000]
+ train/ActionNoiseL2Loss=0.1784
+ throughput/total_tokens=544,128,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2835/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=544,320,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2836/500000]
+ train/ActionNoiseL2Loss=0.1402
+ throughput/total_tokens=544,512,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=2837/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=544,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2838/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=544,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2839/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=545,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2840/500000]
+ optim/total_grad_norm=1.572
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=545,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=2841/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=545,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2842/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=545,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2843/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=545,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2844/500000]
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=546,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2845/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=546,240,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2846/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=546,432,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2847/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=546,624,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2848/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=546,816,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2849/500000]
+ train/ActionNoiseL2Loss=0.1708
+ throughput/total_tokens=547,008,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2850/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=547,200,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=2851/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=547,392,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2852/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=547,584,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2853/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=547,776,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2854/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=547,968,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2855/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=548,160,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2856/500000]
+ train/ActionNoiseL2Loss=0.1411
+ throughput/total_tokens=548,352,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2857/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=548,544,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2858/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=548,736,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2859/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=548,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2860/500000]
+ optim/total_grad_norm=1.269
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=549,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2861/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=549,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2862/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=549,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2863/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=549,696,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2864/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=549,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2865/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=550,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2866/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=550,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2867/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=550,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2868/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=550,656,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2869/500000]
+ train/ActionNoiseL2Loss=0.1366
+ throughput/total_tokens=550,848,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2870/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=551,040,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=2871/500000]
+ train/ActionNoiseL2Loss=0.0976
+ throughput/total_tokens=551,232,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2872/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=551,424,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2873/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=551,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2874/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=551,808,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2875/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=552,000,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2876/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=552,192,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2877/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=552,384,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2878/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=552,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2879/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=552,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2880/500000]
+ optim/total_grad_norm=0.8905
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=552,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=2881/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=553,152,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2882/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=553,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=2883/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=553,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=2884/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=553,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2885/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=553,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2886/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=554,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2887/500000]
+ train/ActionNoiseL2Loss=0.1041
+ throughput/total_tokens=554,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2888/500000]
+ train/ActionNoiseL2Loss=0.1511
+ throughput/total_tokens=554,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2889/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=554,688,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2890/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=554,880,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2891/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=555,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2892/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=555,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2893/500000]
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=555,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2894/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=555,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2895/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=555,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2896/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=556,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2897/500000]
+ train/ActionNoiseL2Loss=0.1232
+ throughput/total_tokens=556,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2898/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=556,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2899/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=556,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2900/500000]
+ optim/total_grad_norm=1.085
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=556,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2901/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=556,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2902/500000]
+ train/ActionNoiseL2Loss=0.1147
+ throughput/total_tokens=557,184,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2903/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=557,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2904/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=557,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2905/500000]
+ train/ActionNoiseL2Loss=0.1499
+ throughput/total_tokens=557,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2906/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=557,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2907/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=558,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2908/500000]
+ train/ActionNoiseL2Loss=0.1054
+ throughput/total_tokens=558,336,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2909/500000]
+ train/ActionNoiseL2Loss=0.1184
+ throughput/total_tokens=558,528,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2910/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=558,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2911/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=558,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2912/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=559,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2913/500000]
+ train/ActionNoiseL2Loss=0.1263
+ throughput/total_tokens=559,296,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2914/500000]
+ train/ActionNoiseL2Loss=0.1175
+ throughput/total_tokens=559,488,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2915/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=559,680,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2916/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=559,872,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2917/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=560,064,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2918/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=560,256,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2919/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=560,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2920/500000]
+ optim/total_grad_norm=1.624
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=560,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2921/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=560,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2922/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=561,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2923/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=561,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2924/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=561,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2925/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=561,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2926/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=561,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2927/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=561,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2928/500000]
+ train/ActionNoiseL2Loss=0.1037
+ throughput/total_tokens=562,176,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2929/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=562,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2930/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=562,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2931/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=562,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2932/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=562,944,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2933/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=563,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2934/500000]
+ train/ActionNoiseL2Loss=0.1198
+ throughput/total_tokens=563,328,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2935/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=563,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2936/500000]
+ train/ActionNoiseL2Loss=0.1353
+ throughput/total_tokens=563,712,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2937/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=563,904,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2938/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=564,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2939/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=564,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2940/500000]
+ optim/total_grad_norm=1.320
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=564,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=2941/500000]
+ train/ActionNoiseL2Loss=0.1584
+ throughput/total_tokens=564,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2942/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=564,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=2943/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=565,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=2944/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=565,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2945/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=565,440,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=2946/500000]
+ train/ActionNoiseL2Loss=0.1180
+ throughput/total_tokens=565,632,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2947/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=565,824,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2948/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=566,016,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=2949/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=566,208,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=2950/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=566,400,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=2951/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=566,592,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2952/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=566,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2953/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=566,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2954/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=567,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2955/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=567,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2956/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=567,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2957/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=567,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2958/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=567,936,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2959/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=568,128,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=2960/500000]
+ optim/total_grad_norm=1.062
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=568,320,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=2961/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=568,512,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=2962/500000]
+ train/ActionNoiseL2Loss=0.1130
+ throughput/total_tokens=568,704,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2963/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=568,896,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2964/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=569,088,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2965/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=569,280,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2966/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=569,472,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2967/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=569,664,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=2968/500000]
+ train/ActionNoiseL2Loss=0.1230
+ throughput/total_tokens=569,856,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=2969/500000]
+ train/ActionNoiseL2Loss=0.1223
+ throughput/total_tokens=570,048,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=2970/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=570,240,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2971/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=570,432,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2972/500000]
+ train/ActionNoiseL2Loss=0.1429
+ throughput/total_tokens=570,624,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2973/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=570,816,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2974/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=571,008,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2975/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=571,200,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2976/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=571,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=2977/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=571,584,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2978/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=571,776,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2979/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=571,968,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2980/500000]
+ optim/total_grad_norm=1.485
+ train/ActionNoiseL2Loss=0.1064
+ throughput/total_tokens=572,160,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2981/500000]
+ train/ActionNoiseL2Loss=0.1180
+ throughput/total_tokens=572,352,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2982/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=572,544,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2983/500000]
+ train/ActionNoiseL2Loss=0.1153
+ throughput/total_tokens=572,736,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2984/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=572,928,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2985/500000]
+ train/ActionNoiseL2Loss=0.1394
+ throughput/total_tokens=573,120,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2986/500000]
+ train/ActionNoiseL2Loss=0.1337
+ throughput/total_tokens=573,312,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2987/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=573,504,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2988/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=573,696,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2989/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=573,888,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2990/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=574,080,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=2991/500000]
+ train/ActionNoiseL2Loss=0.1194
+ throughput/total_tokens=574,272,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2992/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=574,464,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2993/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=574,656,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2994/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=574,848,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=2995/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=575,040,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2996/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=575,232,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2997/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=575,424,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=2998/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=575,616,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=2999/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=575,808,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3000/500000]
+ optim/total_grad_norm=1.764
+ train/ActionNoiseL2Loss=0.1335
+ throughput/total_tokens=576,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+10/12 [10:29:23] INFO | >> Saving config... checkpoint.py:608
+10/12 [10:30:13] INFO | >> Saving model state... checkpoint.py:796
+10/12 [10:31:26] INFO | >> Saving optim state... checkpoint.py:811
+10/12 [10:32:57] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=3001/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=576,192,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=3002/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=576,384,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=3003/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=576,576,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=3004/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=576,768,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=3005/500000]
+ train/ActionNoiseL2Loss=0.1209
+ throughput/total_tokens=576,960,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=3006/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=577,152,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=3007/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=577,344,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=3008/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=577,536,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3009/500000]
+ train/ActionNoiseL2Loss=0.1021
+ throughput/total_tokens=577,728,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3010/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=577,920,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3011/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=578,112,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3012/500000]
+ train/ActionNoiseL2Loss=0.1491
+ throughput/total_tokens=578,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3013/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=578,496,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3014/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=578,688,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3015/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=578,880,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3016/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=579,072,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3017/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=579,264,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3018/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=579,456,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3019/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=579,648,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3020/500000]
+ optim/total_grad_norm=1.662
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=579,840,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3021/500000]
+ train/ActionNoiseL2Loss=0.1123
+ throughput/total_tokens=580,032,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3022/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=580,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3023/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=580,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3024/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=580,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3025/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=580,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3026/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=580,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3027/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=581,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3028/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=581,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3029/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=581,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3030/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=581,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3031/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=581,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3032/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=582,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3033/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=582,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3034/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=582,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3035/500000]
+ train/ActionNoiseL2Loss=0.1445
+ throughput/total_tokens=582,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3036/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=582,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3037/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=583,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3038/500000]
+ train/ActionNoiseL2Loss=0.1104
+ throughput/total_tokens=583,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3039/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=583,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3040/500000]
+ optim/total_grad_norm=1.627
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=583,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3041/500000]
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=583,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3042/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=584,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3043/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=584,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3044/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=584,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3045/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=584,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3046/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=584,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3047/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=585,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3048/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=585,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3049/500000]
+ train/ActionNoiseL2Loss=0.1120
+ throughput/total_tokens=585,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3050/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=585,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3051/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=585,792,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3052/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=585,984,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3053/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=586,176,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3054/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=586,368,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3055/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=586,560,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=3056/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=586,752,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3057/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=586,944,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3058/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=587,136,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3059/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=587,328,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3060/500000]
+ optim/total_grad_norm=1.305
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=587,520,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=3061/500000]
+ train/ActionNoiseL2Loss=0.1250
+ throughput/total_tokens=587,712,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3062/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=587,904,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3063/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=588,096,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3064/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=588,288,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3065/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=588,480,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3066/500000]
+ train/ActionNoiseL2Loss=0.1620
+ throughput/total_tokens=588,672,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3067/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=588,864,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3068/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=589,056,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3069/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=589,248,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3070/500000]
+ train/ActionNoiseL2Loss=0.1301
+ throughput/total_tokens=589,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3071/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=589,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3072/500000]
+ train/ActionNoiseL2Loss=0.1086
+ throughput/total_tokens=589,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3073/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=590,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3074/500000]
+ train/ActionNoiseL2Loss=0.1529
+ throughput/total_tokens=590,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3075/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=590,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3076/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=590,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3077/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=590,784,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3078/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=590,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3079/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=591,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3080/500000]
+ optim/total_grad_norm=1.397
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=591,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3081/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=591,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3082/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=591,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3083/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=591,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3084/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=592,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3085/500000]
+ train/ActionNoiseL2Loss=0.1232
+ throughput/total_tokens=592,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3086/500000]
+ train/ActionNoiseL2Loss=0.1095
+ throughput/total_tokens=592,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3087/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=592,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3088/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=592,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3089/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=593,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3090/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=593,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3091/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=593,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3092/500000]
+ train/ActionNoiseL2Loss=0.1359
+ throughput/total_tokens=593,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3093/500000]
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=593,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3094/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=594,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3095/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=594,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3096/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=594,432,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3097/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=594,624,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3098/500000]
+ train/ActionNoiseL2Loss=0.1267
+ throughput/total_tokens=594,816,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3099/500000]
+ train/ActionNoiseL2Loss=0.1344
+ throughput/total_tokens=595,008,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3100/500000]
+ optim/total_grad_norm=1.374
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=595,200,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=3101/500000]
+ train/ActionNoiseL2Loss=0.1562
+ throughput/total_tokens=595,392,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3102/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=595,584,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3103/500000]
+ train/ActionNoiseL2Loss=0.1202
+ throughput/total_tokens=595,776,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3104/500000]
+ train/ActionNoiseL2Loss=0.1415
+ throughput/total_tokens=595,968,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3105/500000]
+ train/ActionNoiseL2Loss=0.1252
+ throughput/total_tokens=596,160,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3106/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=596,352,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3107/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=596,544,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3108/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=596,736,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3109/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=596,928,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3110/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=597,120,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3111/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=597,312,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3112/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=597,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3113/500000]
+ train/ActionNoiseL2Loss=0.1164
+ throughput/total_tokens=597,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3114/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=597,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3115/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=598,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3116/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=598,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3117/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=598,464,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3118/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=598,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3119/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=598,848,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3120/500000]
+ optim/total_grad_norm=1.019
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=599,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3121/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=599,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3122/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=599,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3123/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=599,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3124/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=599,808,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3125/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=600,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3126/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=600,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3127/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=600,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3128/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=600,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3129/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=600,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3130/500000]
+ train/ActionNoiseL2Loss=0.1380
+ throughput/total_tokens=600,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=3131/500000]
+ train/ActionNoiseL2Loss=0.1037
+ throughput/total_tokens=601,152,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3132/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=601,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3133/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=601,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3134/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=601,728,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3135/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=601,920,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3136/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=602,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3137/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=602,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3138/500000]
+ train/ActionNoiseL2Loss=0.1216
+ throughput/total_tokens=602,496,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3139/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=602,688,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3140/500000]
+ optim/total_grad_norm=1.690
+ train/ActionNoiseL2Loss=0.1217
+ throughput/total_tokens=602,880,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=3141/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=603,072,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3142/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=603,264,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3143/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=603,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3144/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=603,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3145/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=603,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3146/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=604,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3147/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=604,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3148/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=604,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3149/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=604,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3150/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=604,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3151/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=604,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3152/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=605,184,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3153/500000]
+ train/ActionNoiseL2Loss=0.1402
+ throughput/total_tokens=605,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3154/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=605,568,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3155/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=605,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3156/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=605,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3157/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=606,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3158/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=606,336,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3159/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=606,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3160/500000]
+ optim/total_grad_norm=0.7630
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=606,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3161/500000]
+ train/ActionNoiseL2Loss=0.1173
+ throughput/total_tokens=606,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3162/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=607,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3163/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=607,296,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3164/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=607,488,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3165/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=607,680,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3166/500000]
+ train/ActionNoiseL2Loss=0.1088
+ throughput/total_tokens=607,872,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3167/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=608,064,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3168/500000]
+ train/ActionNoiseL2Loss=0.1512
+ throughput/total_tokens=608,256,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3169/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=608,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3170/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=608,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3171/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=608,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3172/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=609,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3173/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=609,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3174/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=609,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3175/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=609,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3176/500000]
+ train/ActionNoiseL2Loss=0.1120
+ throughput/total_tokens=609,792,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3177/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=609,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3178/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=610,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3179/500000]
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=610,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3180/500000]
+ optim/total_grad_norm=1.752
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=610,560,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3181/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=610,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3182/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=610,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3183/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=611,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3184/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=611,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3185/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=611,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3186/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=611,712,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3187/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=611,904,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3188/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=612,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3189/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=612,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3190/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=612,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3191/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=612,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3192/500000]
+ train/ActionNoiseL2Loss=0.1516
+ throughput/total_tokens=612,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3193/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=613,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3194/500000]
+ train/ActionNoiseL2Loss=0.1162
+ throughput/total_tokens=613,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3195/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=613,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3196/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=613,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3197/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=613,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3198/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=614,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3199/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=614,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3200/500000]
+ optim/total_grad_norm=1.850
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=614,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3201/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=614,592,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3202/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=614,784,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3203/500000]
+ train/ActionNoiseL2Loss=0.1243
+ throughput/total_tokens=614,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3204/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=615,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3205/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=615,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3206/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=615,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3207/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=615,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3208/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=615,936,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3209/500000]
+ train/ActionNoiseL2Loss=0.1137
+ throughput/total_tokens=616,128,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3210/500000]
+ train/ActionNoiseL2Loss=0.1132
+ throughput/total_tokens=616,320,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3211/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=616,512,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3212/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=616,704,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3213/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=616,896,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3214/500000]
+ train/ActionNoiseL2Loss=0.1604
+ throughput/total_tokens=617,088,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3215/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=617,280,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3216/500000]
+ train/ActionNoiseL2Loss=0.1350
+ throughput/total_tokens=617,472,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3217/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=617,664,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3218/500000]
+ train/ActionNoiseL2Loss=0.1038
+ throughput/total_tokens=617,856,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3219/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=618,048,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3220/500000]
+ optim/total_grad_norm=1.431
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=618,240,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3221/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=618,432,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3222/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=618,624,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3223/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=618,816,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3224/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=619,008,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3225/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=619,200,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3226/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=619,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3227/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=619,584,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3228/500000]
+ train/ActionNoiseL2Loss=0.1509
+ throughput/total_tokens=619,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3229/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=619,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3230/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=620,160,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3231/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=620,352,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3232/500000]
+ train/ActionNoiseL2Loss=0.1356
+ throughput/total_tokens=620,544,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3233/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=620,736,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3234/500000]
+ train/ActionNoiseL2Loss=0.1606
+ throughput/total_tokens=620,928,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3235/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=621,120,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3236/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=621,312,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3237/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=621,504,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3238/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=621,696,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3239/500000]
+ train/ActionNoiseL2Loss=0.1117
+ throughput/total_tokens=621,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3240/500000]
+ optim/total_grad_norm=1.916
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=622,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3241/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=622,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3242/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=622,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3243/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=622,656,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3244/500000]
+ train/ActionNoiseL2Loss=0.1468
+ throughput/total_tokens=622,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3245/500000]
+ train/ActionNoiseL2Loss=0.1063
+ throughput/total_tokens=623,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3246/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=623,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3247/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=623,424,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3248/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=623,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3249/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=623,808,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3250/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=624,000,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=3251/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=624,192,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3252/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=624,384,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3253/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=624,576,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3254/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=624,768,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3255/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=624,960,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3256/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=625,152,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3257/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=625,344,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3258/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=625,536,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3259/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=625,728,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3260/500000]
+ optim/total_grad_norm=1.257
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=625,920,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3261/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=626,112,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3262/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=626,304,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3263/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=626,496,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3264/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=626,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3265/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=626,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3266/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=627,072,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3267/500000]
+ train/ActionNoiseL2Loss=0.1275
+ throughput/total_tokens=627,264,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3268/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=627,456,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3269/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=627,648,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3270/500000]
+ train/ActionNoiseL2Loss=0.1365
+ throughput/total_tokens=627,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3271/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=628,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3272/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=628,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3273/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=628,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3274/500000]
+ train/ActionNoiseL2Loss=0.1174
+ throughput/total_tokens=628,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3275/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=628,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3276/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=628,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3277/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=629,184,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3278/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=629,376,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3279/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=629,568,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3280/500000]
+ optim/total_grad_norm=1.808
+ train/ActionNoiseL2Loss=0.1315
+ throughput/total_tokens=629,760,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3281/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=629,952,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=3282/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=630,144,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3283/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=630,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3284/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=630,528,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3285/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=630,720,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3286/500000]
+ train/ActionNoiseL2Loss=0.1568
+ throughput/total_tokens=630,912,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3287/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=631,104,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3288/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=631,296,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3289/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=631,488,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3290/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=631,680,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3291/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=631,872,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3292/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=632,064,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3293/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=632,256,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3294/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=632,448,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3295/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=632,640,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=3296/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=632,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3297/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=633,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3298/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=633,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3299/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=633,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3300/500000]
+ optim/total_grad_norm=1.354
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=633,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3301/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=633,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3302/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=633,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3303/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=634,176,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3304/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=634,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3305/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=634,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3306/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=634,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3307/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=634,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3308/500000]
+ train/ActionNoiseL2Loss=0.1413
+ throughput/total_tokens=635,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3309/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=635,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3310/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=635,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3311/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=635,712,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3312/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=635,904,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3313/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=636,096,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3314/500000]
+ train/ActionNoiseL2Loss=0.1057
+ throughput/total_tokens=636,288,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3315/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=636,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3316/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=636,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3317/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=636,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3318/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=637,056,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3319/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=637,248,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3320/500000]
+ optim/total_grad_norm=0.9736
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=637,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3321/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=637,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3322/500000]
+ train/ActionNoiseL2Loss=0.1331
+ throughput/total_tokens=637,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3323/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=638,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3324/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=638,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3325/500000]
+ train/ActionNoiseL2Loss=0.1133
+ throughput/total_tokens=638,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3326/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=638,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3327/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=638,784,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3328/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=638,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3329/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=639,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3330/500000]
+ train/ActionNoiseL2Loss=0.1251
+ throughput/total_tokens=639,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3331/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=639,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3332/500000]
+ train/ActionNoiseL2Loss=0.1026
+ throughput/total_tokens=639,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3333/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=639,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3334/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=640,128,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3335/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=640,320,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3336/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=640,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3337/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=640,704,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3338/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=640,896,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3339/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=641,088,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3340/500000]
+ optim/total_grad_norm=0.9325
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=641,280,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3341/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=641,472,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3342/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=641,664,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3343/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=641,856,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3344/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=642,048,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3345/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=642,240,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3346/500000]
+ train/ActionNoiseL2Loss=0.1463
+ throughput/total_tokens=642,432,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3347/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=642,624,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3348/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=642,816,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3349/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=643,008,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3350/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=643,200,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3351/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=643,392,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3352/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=643,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3353/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=643,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3354/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=643,968,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3355/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=644,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3356/500000]
+ train/ActionNoiseL2Loss=0.1147
+ throughput/total_tokens=644,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3357/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=644,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3358/500000]
+ train/ActionNoiseL2Loss=0.1563
+ throughput/total_tokens=644,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3359/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=644,928,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3360/500000]
+ optim/total_grad_norm=1.055
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=645,120,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3361/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=645,312,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3362/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=645,504,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3363/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=645,696,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3364/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=645,888,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3365/500000]
+ train/ActionNoiseL2Loss=0.1598
+ throughput/total_tokens=646,080,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3366/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=646,272,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3367/500000]
+ train/ActionNoiseL2Loss=0.1079
+ throughput/total_tokens=646,464,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3368/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=646,656,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3369/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=646,848,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3370/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=647,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3371/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=647,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3372/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=647,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3373/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=647,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3374/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=647,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3375/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=648,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3376/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=648,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3377/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=648,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3378/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=648,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3379/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=648,768,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3380/500000]
+ optim/total_grad_norm=1.341
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=648,960,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3381/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=649,152,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3382/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=649,344,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3383/500000]
+ train/ActionNoiseL2Loss=0.1300
+ throughput/total_tokens=649,536,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3384/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=649,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3385/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=649,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3386/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=650,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3387/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=650,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3388/500000]
+ train/ActionNoiseL2Loss=0.1204
+ throughput/total_tokens=650,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3389/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=650,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3390/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=650,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3391/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=651,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3392/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=651,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3393/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=651,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3394/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=651,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3395/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=651,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3396/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=652,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3397/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=652,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3398/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=652,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3399/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=652,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3400/500000]
+ optim/total_grad_norm=1.039
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=652,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3401/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=652,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3402/500000]
+ train/ActionNoiseL2Loss=0.1237
+ throughput/total_tokens=653,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3403/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=653,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3404/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=653,568,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3405/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=653,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3406/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=653,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3407/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=654,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3408/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=654,336,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3409/500000]
+ train/ActionNoiseL2Loss=0.1105
+ throughput/total_tokens=654,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3410/500000]
+ train/ActionNoiseL2Loss=0.1274
+ throughput/total_tokens=654,720,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3411/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=654,912,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3412/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=655,104,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3413/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=655,296,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3414/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=655,488,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3415/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=655,680,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3416/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=655,872,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3417/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=656,064,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3418/500000]
+ train/ActionNoiseL2Loss=0.1312
+ throughput/total_tokens=656,256,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3419/500000]
+ train/ActionNoiseL2Loss=0.1627
+ throughput/total_tokens=656,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3420/500000]
+ optim/total_grad_norm=2.047
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=656,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3421/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=656,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3422/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=657,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3423/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=657,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3424/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=657,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3425/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=657,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3426/500000]
+ train/ActionNoiseL2Loss=0.1254
+ throughput/total_tokens=657,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3427/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=657,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3428/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=658,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3429/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=658,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3430/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=658,560,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3431/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=658,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3432/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=658,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3433/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=659,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3434/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=659,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3435/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=659,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3436/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=659,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3437/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=659,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3438/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=660,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3439/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=660,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3440/500000]
+ optim/total_grad_norm=2.316
+ train/ActionNoiseL2Loss=0.1548
+ throughput/total_tokens=660,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=3441/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=660,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3442/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=660,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3443/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=661,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3444/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=661,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3445/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=661,440,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3446/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=661,632,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3447/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=661,824,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3448/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=662,016,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3449/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=662,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3450/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=662,400,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=3451/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=662,592,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3452/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=662,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3453/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=662,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3454/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=663,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3455/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=663,360,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3456/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=663,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3457/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=663,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3458/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=663,936,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3459/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=664,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3460/500000]
+ optim/total_grad_norm=1.686
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=664,320,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3461/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=664,512,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3462/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=664,704,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3463/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=664,896,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3464/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=665,088,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3465/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=665,280,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3466/500000]
+ train/ActionNoiseL2Loss=0.1349
+ throughput/total_tokens=665,472,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3467/500000]
+ train/ActionNoiseL2Loss=0.1460
+ throughput/total_tokens=665,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3468/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=665,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3469/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=666,048,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3470/500000]
+ train/ActionNoiseL2Loss=0.1099
+ throughput/total_tokens=666,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3471/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=666,432,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3472/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=666,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3473/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=666,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3474/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=667,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3475/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=667,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3476/500000]
+ train/ActionNoiseL2Loss=0.0998
+ throughput/total_tokens=667,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3477/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=667,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3478/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=667,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3479/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=667,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3480/500000]
+ optim/total_grad_norm=0.9893
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=668,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3481/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=668,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3482/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=668,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3483/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=668,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3484/500000]
+ train/ActionNoiseL2Loss=0.1306
+ throughput/total_tokens=668,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3485/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=669,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3486/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=669,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3487/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=669,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3488/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=669,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3489/500000]
+ train/ActionNoiseL2Loss=0.0967
+ throughput/total_tokens=669,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3490/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=670,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3491/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=670,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3492/500000]
+ train/ActionNoiseL2Loss=0.1456
+ throughput/total_tokens=670,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3493/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=670,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3494/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=670,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3495/500000]
+ train/ActionNoiseL2Loss=0.1109
+ throughput/total_tokens=671,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3496/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=671,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3497/500000]
+ train/ActionNoiseL2Loss=0.1565
+ throughput/total_tokens=671,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3498/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=671,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3499/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=671,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3500/500000]
+ optim/total_grad_norm=1.052
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=672,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+10/12 [13:28:14] INFO | >> Saving config... checkpoint.py:608
+10/12 [13:28:47] INFO | >> Saving model state... checkpoint.py:796
+10/12 [13:30:01] INFO | >> Saving optim state... checkpoint.py:811
+10/12 [13:31:33] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=3501/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=672,192,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0475
+[step=3502/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=672,384,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=3503/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=672,576,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=3504/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=672,768,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=3505/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=672,960,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=3506/500000]
+ train/ActionNoiseL2Loss=0.1018
+ throughput/total_tokens=673,152,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=3507/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=673,344,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=3508/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=673,536,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=3509/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=673,728,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3510/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=673,920,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=3511/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=674,112,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3512/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=674,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3513/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=674,496,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3514/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=674,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3515/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=674,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3516/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=675,072,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3517/500000]
+ train/ActionNoiseL2Loss=0.1186
+ throughput/total_tokens=675,264,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3518/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=675,456,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3519/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=675,648,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3520/500000]
+ optim/total_grad_norm=1.479
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=675,840,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3521/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=676,032,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3522/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=676,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3523/500000]
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=676,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3524/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=676,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3525/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=676,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3526/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=676,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3527/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=677,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3528/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=677,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3529/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=677,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3530/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=677,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3531/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=677,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3532/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=678,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3533/500000]
+ train/ActionNoiseL2Loss=0.1634
+ throughput/total_tokens=678,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3534/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=678,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3535/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=678,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3536/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=678,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3537/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=679,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3538/500000]
+ train/ActionNoiseL2Loss=0.1424
+ throughput/total_tokens=679,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3539/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=679,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3540/500000]
+ optim/total_grad_norm=1.872
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=679,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3541/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=679,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3542/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=680,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3543/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=680,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3544/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=680,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3545/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=680,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3546/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=680,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3547/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=681,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3548/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=681,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3549/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=681,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3550/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=681,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3551/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=681,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3552/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=681,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3553/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=682,176,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3554/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=682,368,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3555/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=682,560,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3556/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=682,752,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3557/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=682,944,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3558/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=683,136,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3559/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=683,328,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3560/500000]
+ optim/total_grad_norm=0.9537
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=683,520,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=3561/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=683,712,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3562/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=683,904,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3563/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=684,096,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3564/500000]
+ train/ActionNoiseL2Loss=0.1106
+ throughput/total_tokens=684,288,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3565/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=684,480,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3566/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=684,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3567/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=684,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3568/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=685,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3569/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=685,248,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3570/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=685,440,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3571/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=685,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3572/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=685,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3573/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=686,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3574/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=686,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3575/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=686,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3576/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=686,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3577/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=686,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3578/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=686,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3579/500000]
+ train/ActionNoiseL2Loss=0.1396
+ throughput/total_tokens=687,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3580/500000]
+ optim/total_grad_norm=1.213
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=687,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3581/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=687,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3582/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=687,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3583/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=687,936,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3584/500000]
+ train/ActionNoiseL2Loss=0.1099
+ throughput/total_tokens=688,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3585/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=688,320,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3586/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=688,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3587/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=688,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3588/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=688,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3589/500000]
+ train/ActionNoiseL2Loss=0.1786
+ throughput/total_tokens=689,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3590/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=689,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3591/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=689,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3592/500000]
+ train/ActionNoiseL2Loss=0.1249
+ throughput/total_tokens=689,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3593/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=689,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3594/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=690,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3595/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=690,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3596/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=690,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3597/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=690,624,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3598/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=690,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3599/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=691,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3600/500000]
+ optim/total_grad_norm=1.360
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=691,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3601/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=691,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3602/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=691,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3603/500000]
+ train/ActionNoiseL2Loss=0.1608
+ throughput/total_tokens=691,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3604/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=691,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3605/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=692,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3606/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=692,352,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3607/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=692,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3608/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=692,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3609/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=692,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3610/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=693,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=3611/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=693,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3612/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=693,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3613/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=693,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3614/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=693,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3615/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=694,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3616/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=694,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3617/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=694,464,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3618/500000]
+ train/ActionNoiseL2Loss=0.1760
+ throughput/total_tokens=694,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3619/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=694,848,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3620/500000]
+ optim/total_grad_norm=1.087
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=695,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3621/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=695,232,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=3622/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=695,424,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3623/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=695,616,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3624/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=695,808,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=3625/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=696,000,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3626/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=696,192,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=3627/500000]
+ train/ActionNoiseL2Loss=0.1606
+ throughput/total_tokens=696,384,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=3628/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=696,576,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3629/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=696,768,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3630/500000]
+ train/ActionNoiseL2Loss=0.2012
+ throughput/total_tokens=696,960,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3631/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=697,152,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3632/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=697,344,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3633/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=697,536,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3634/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=697,728,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3635/500000]
+ train/ActionNoiseL2Loss=0.1272
+ throughput/total_tokens=697,920,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3636/500000]
+ train/ActionNoiseL2Loss=0.1332
+ throughput/total_tokens=698,112,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3637/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=698,304,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3638/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=698,496,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=3639/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=698,688,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3640/500000]
+ optim/total_grad_norm=1.606
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=698,880,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3641/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=699,072,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3642/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=699,264,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3643/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=699,456,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3644/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=699,648,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3645/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=699,840,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3646/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=700,032,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3647/500000]
+ train/ActionNoiseL2Loss=0.1890
+ throughput/total_tokens=700,224,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3648/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=700,416,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3649/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=700,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3650/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=700,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3651/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=700,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3652/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=701,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3653/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=701,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3654/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=701,568,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3655/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=701,760,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3656/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=701,952,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3657/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=702,144,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3658/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=702,336,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3659/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=702,528,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3660/500000]
+ optim/total_grad_norm=0.7483
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=702,720,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=3661/500000]
+ train/ActionNoiseL2Loss=0.1038
+ throughput/total_tokens=702,912,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3662/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=703,104,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3663/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=703,296,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3664/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=703,488,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3665/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=703,680,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3666/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=703,872,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3667/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=704,064,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3668/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=704,256,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3669/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=704,448,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3670/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=704,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3671/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=704,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3672/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=705,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3673/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=705,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3674/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=705,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3675/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=705,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3676/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=705,792,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3677/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=705,984,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=3678/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=706,176,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3679/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=706,368,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3680/500000]
+ optim/total_grad_norm=1.521
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=706,560,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3681/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=706,752,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3682/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=706,944,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3683/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=707,136,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3684/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=707,328,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3685/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=707,520,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3686/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=707,712,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3687/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=707,904,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3688/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=708,096,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3689/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=708,288,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3690/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=708,480,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3691/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=708,672,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3692/500000]
+ train/ActionNoiseL2Loss=0.1037
+ throughput/total_tokens=708,864,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=3693/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=709,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3694/500000]
+ train/ActionNoiseL2Loss=0.1401
+ throughput/total_tokens=709,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3695/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=709,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3696/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=709,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3697/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=709,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3698/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=710,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3699/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=710,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3700/500000]
+ optim/total_grad_norm=0.8390
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=710,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3701/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=710,592,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3702/500000]
+ train/ActionNoiseL2Loss=0.1197
+ throughput/total_tokens=710,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3703/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=710,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3704/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=711,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3705/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=711,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3706/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=711,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3707/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=711,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3708/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=711,936,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3709/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=712,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3710/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=712,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3711/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=712,512,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3712/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=712,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3713/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=712,896,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3714/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=713,088,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3715/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=713,280,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3716/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=713,472,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3717/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=713,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3718/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=713,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3719/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=714,048,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3720/500000]
+ optim/total_grad_norm=1.748
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=714,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3721/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=714,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3722/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=714,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3723/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=714,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3724/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=715,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3725/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=715,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3726/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=715,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3727/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=715,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3728/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=715,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3729/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=715,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3730/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=716,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3731/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=716,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3732/500000]
+ train/ActionNoiseL2Loss=0.1026
+ throughput/total_tokens=716,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3733/500000]
+ train/ActionNoiseL2Loss=0.1513
+ throughput/total_tokens=716,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3734/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=716,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3735/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=717,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3736/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=717,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3737/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=717,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3738/500000]
+ train/ActionNoiseL2Loss=0.0998
+ throughput/total_tokens=717,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3739/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=717,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3740/500000]
+ optim/total_grad_norm=1.478
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=718,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=3741/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=718,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3742/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=718,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3743/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=718,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3744/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=718,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3745/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=719,040,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3746/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=719,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3747/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=719,424,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3748/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=719,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3749/500000]
+ train/ActionNoiseL2Loss=0.0959
+ throughput/total_tokens=719,808,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3750/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=720,000,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3751/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=720,192,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3752/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=720,384,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3753/500000]
+ train/ActionNoiseL2Loss=0.1266
+ throughput/total_tokens=720,576,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3754/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=720,768,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3755/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=720,960,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3756/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=721,152,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3757/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=721,344,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3758/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=721,536,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3759/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=721,728,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3760/500000]
+ optim/total_grad_norm=0.7950
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=721,920,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3761/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=722,112,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3762/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=722,304,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3763/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=722,496,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3764/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=722,688,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3765/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=722,880,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3766/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=723,072,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3767/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=723,264,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3768/500000]
+ train/ActionNoiseL2Loss=0.0980
+ throughput/total_tokens=723,456,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3769/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=723,648,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3770/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=723,840,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=3771/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=724,032,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3772/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=724,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3773/500000]
+ train/ActionNoiseL2Loss=0.1537
+ throughput/total_tokens=724,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3774/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=724,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3775/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=724,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3776/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=724,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3777/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=725,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3778/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=725,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3779/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=725,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3780/500000]
+ optim/total_grad_norm=0.5458
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=725,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3781/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=725,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3782/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=726,144,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3783/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=726,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3784/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=726,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3785/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=726,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3786/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=726,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3787/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=727,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3788/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=727,296,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3789/500000]
+ train/ActionNoiseL2Loss=0.1364
+ throughput/total_tokens=727,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3790/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=727,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3791/500000]
+ train/ActionNoiseL2Loss=0.1151
+ throughput/total_tokens=727,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3792/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=728,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3793/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=728,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3794/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=728,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3795/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=728,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3796/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=728,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3797/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=729,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3798/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=729,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3799/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=729,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3800/500000]
+ optim/total_grad_norm=1.403
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=729,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3801/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=729,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3802/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=729,984,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3803/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=730,176,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=3804/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=730,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3805/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=730,560,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3806/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=730,752,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3807/500000]
+ train/ActionNoiseL2Loss=0.0968
+ throughput/total_tokens=730,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3808/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=731,136,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3809/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=731,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3810/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=731,520,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3811/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=731,712,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3812/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=731,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3813/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=732,096,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3814/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=732,288,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3815/500000]
+ train/ActionNoiseL2Loss=0.1150
+ throughput/total_tokens=732,480,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3816/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=732,672,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3817/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=732,864,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3818/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=733,056,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3819/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=733,248,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3820/500000]
+ optim/total_grad_norm=1.164
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=733,440,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=3821/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=733,632,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3822/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=733,824,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3823/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=734,016,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3824/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=734,208,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3825/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=734,400,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3826/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=734,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3827/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=734,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3828/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=734,976,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3829/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=735,168,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3830/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=735,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=3831/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=735,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3832/500000]
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=735,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3833/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=735,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3834/500000]
+ train/ActionNoiseL2Loss=0.1146
+ throughput/total_tokens=736,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3835/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=736,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3836/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=736,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3837/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=736,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3838/500000]
+ train/ActionNoiseL2Loss=0.1029
+ throughput/total_tokens=736,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3839/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=737,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3840/500000]
+ optim/total_grad_norm=0.8706
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=737,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=3841/500000]
+ train/ActionNoiseL2Loss=0.1254
+ throughput/total_tokens=737,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3842/500000]
+ train/ActionNoiseL2Loss=0.1326
+ throughput/total_tokens=737,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3843/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=737,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3844/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=738,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3845/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=738,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3846/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=738,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3847/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=738,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3848/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=738,816,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3849/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=739,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3850/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=739,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3851/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=739,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3852/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=739,584,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3853/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=739,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3854/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=739,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3855/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=740,160,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3856/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=740,352,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3857/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=740,544,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3858/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=740,736,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3859/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=740,928,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3860/500000]
+ optim/total_grad_norm=1.093
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=741,120,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3861/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=741,312,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3862/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=741,504,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3863/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=741,696,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3864/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=741,888,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3865/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=742,080,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3866/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=742,272,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3867/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=742,464,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3868/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=742,656,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3869/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=742,848,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3870/500000]
+ train/ActionNoiseL2Loss=0.1303
+ throughput/total_tokens=743,040,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=3871/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=743,232,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3872/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=743,424,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3873/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=743,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3874/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=743,808,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3875/500000]
+ train/ActionNoiseL2Loss=0.1409
+ throughput/total_tokens=744,000,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3876/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=744,192,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3877/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=744,384,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3878/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=744,576,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3879/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=744,768,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=3880/500000]
+ optim/total_grad_norm=1.006
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=744,960,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=3881/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=745,152,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3882/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=745,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3883/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=745,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3884/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=745,728,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=3885/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=745,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3886/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=746,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3887/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=746,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=3888/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=746,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3889/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=746,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3890/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=746,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3891/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=747,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3892/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=747,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3893/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=747,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3894/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=747,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3895/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=747,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3896/500000]
+ train/ActionNoiseL2Loss=0.1254
+ throughput/total_tokens=748,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3897/500000]
+ train/ActionNoiseL2Loss=0.1066
+ throughput/total_tokens=748,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3898/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=748,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3899/500000]
+ train/ActionNoiseL2Loss=0.1012
+ throughput/total_tokens=748,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3900/500000]
+ optim/total_grad_norm=0.9885
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=748,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3901/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=748,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3902/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=749,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3903/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=749,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3904/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=749,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3905/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=749,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3906/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=749,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3907/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=750,144,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3908/500000]
+ train/ActionNoiseL2Loss=0.1385
+ throughput/total_tokens=750,336,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3909/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=750,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3910/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=750,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3911/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=750,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3912/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=751,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3913/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=751,296,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3914/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=751,488,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3915/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=751,680,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3916/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=751,872,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3917/500000]
+ train/ActionNoiseL2Loss=0.1164
+ throughput/total_tokens=752,064,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3918/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=752,256,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=3919/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=752,448,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3920/500000]
+ optim/total_grad_norm=0.8199
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=752,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3921/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=752,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3922/500000]
+ train/ActionNoiseL2Loss=0.1236
+ throughput/total_tokens=753,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3923/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=753,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3924/500000]
+ train/ActionNoiseL2Loss=0.1148
+ throughput/total_tokens=753,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3925/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=753,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3926/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=753,792,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3927/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=753,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3928/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=754,176,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3929/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=754,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3930/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=754,560,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3931/500000]
+ train/ActionNoiseL2Loss=0.1338
+ throughput/total_tokens=754,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3932/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=754,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3933/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=755,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3934/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=755,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3935/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=755,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3936/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=755,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3937/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=755,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3938/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=756,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3939/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=756,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3940/500000]
+ optim/total_grad_norm=2.372
+ train/ActionNoiseL2Loss=0.1271
+ throughput/total_tokens=756,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3941/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=756,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3942/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=756,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3943/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=757,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3944/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=757,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3945/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=757,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3946/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=757,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3947/500000]
+ train/ActionNoiseL2Loss=0.1234
+ throughput/total_tokens=757,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3948/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=758,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3949/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=758,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3950/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=758,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3951/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=758,592,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3952/500000]
+ train/ActionNoiseL2Loss=0.1203
+ throughput/total_tokens=758,784,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3953/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=758,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=3954/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=759,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3955/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=759,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3956/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=759,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3957/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=759,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3958/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=759,936,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3959/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=760,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3960/500000]
+ optim/total_grad_norm=1.039
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=760,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=3961/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=760,512,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3962/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=760,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3963/500000]
+ train/ActionNoiseL2Loss=0.0976
+ throughput/total_tokens=760,896,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3964/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=761,088,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3965/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=761,280,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=3966/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=761,472,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3967/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=761,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3968/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=761,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3969/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=762,048,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=3970/500000]
+ train/ActionNoiseL2Loss=0.1599
+ throughput/total_tokens=762,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3971/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=762,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3972/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=762,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3973/500000]
+ train/ActionNoiseL2Loss=0.0969
+ throughput/total_tokens=762,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3974/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=763,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3975/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=763,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3976/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=763,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3977/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=763,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3978/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=763,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3979/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=763,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3980/500000]
+ optim/total_grad_norm=1.729
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=764,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3981/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=764,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3982/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=764,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3983/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=764,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3984/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=764,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3985/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=765,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3986/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=765,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3987/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=765,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3988/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=765,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3989/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=765,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3990/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=766,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=3991/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=766,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3992/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=766,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3993/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=766,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3994/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=766,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3995/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=767,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3996/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=767,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=3997/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=767,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3998/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=767,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=3999/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=767,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4000/500000]
+ optim/total_grad_norm=1.330
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=768,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+10/12 [16:27:17] INFO | >> Saving config... checkpoint.py:608
+10/12 [16:27:49] INFO | >> Saving model state... checkpoint.py:796
+10/12 [16:29:02] INFO | >> Saving optim state... checkpoint.py:811
+10/12 [16:30:34] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=4001/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=768,192,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0471
+[step=4002/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=768,384,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=4003/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=768,576,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=4004/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=768,768,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=4005/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=768,960,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=4006/500000]
+ train/ActionNoiseL2Loss=0.1173
+ throughput/total_tokens=769,152,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=4007/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=769,344,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=4008/500000]
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=769,536,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4009/500000]
+ train/ActionNoiseL2Loss=0.1170
+ throughput/total_tokens=769,728,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=4010/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=769,920,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=4011/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=770,112,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4012/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=770,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4013/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=770,496,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4014/500000]
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=770,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4015/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=770,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4016/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=771,072,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4017/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=771,264,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4018/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=771,456,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4019/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=771,648,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4020/500000]
+ optim/total_grad_norm=1.213
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=771,840,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=4021/500000]
+ train/ActionNoiseL2Loss=0.1550
+ throughput/total_tokens=772,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4022/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=772,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4023/500000]
+ train/ActionNoiseL2Loss=0.1341
+ throughput/total_tokens=772,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4024/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=772,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4025/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=772,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4026/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=772,992,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4027/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=773,184,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4028/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=773,376,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4029/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=773,568,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4030/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=773,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4031/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=773,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4032/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=774,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4033/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=774,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4034/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=774,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4035/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=774,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4036/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=774,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4037/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=775,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4038/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=775,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4039/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=775,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4040/500000]
+ optim/total_grad_norm=1.014
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=775,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4041/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=775,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4042/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=776,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4043/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=776,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4044/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=776,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4045/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=776,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4046/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=776,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4047/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=777,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4048/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=777,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4049/500000]
+ train/ActionNoiseL2Loss=0.1220
+ throughput/total_tokens=777,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4050/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=777,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4051/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=777,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4052/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=777,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4053/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=778,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4054/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=778,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4055/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=778,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4056/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=778,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4057/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=778,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4058/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=779,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4059/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=779,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4060/500000]
+ optim/total_grad_norm=1.418
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=779,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=4061/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=779,712,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4062/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=779,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4063/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=780,096,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4064/500000]
+ train/ActionNoiseL2Loss=0.1071
+ throughput/total_tokens=780,288,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4065/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=780,480,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4066/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=780,672,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4067/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=780,864,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4068/500000]
+ train/ActionNoiseL2Loss=0.1288
+ throughput/total_tokens=781,056,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4069/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=781,248,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4070/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=781,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4071/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=781,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4072/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=781,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4073/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=782,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4074/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=782,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4075/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=782,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4076/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=782,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4077/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=782,784,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4078/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=782,976,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4079/500000]
+ train/ActionNoiseL2Loss=0.1420
+ throughput/total_tokens=783,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4080/500000]
+ optim/total_grad_norm=1.134
+ train/ActionNoiseL2Loss=0.1012
+ throughput/total_tokens=783,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4081/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=783,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4082/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=783,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4083/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=783,936,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4084/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=784,128,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4085/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=784,320,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4086/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=784,512,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4087/500000]
+ train/ActionNoiseL2Loss=0.1263
+ throughput/total_tokens=784,704,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4088/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=784,896,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4089/500000]
+ train/ActionNoiseL2Loss=0.1296
+ throughput/total_tokens=785,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4090/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=785,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4091/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=785,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4092/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=785,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4093/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=785,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4094/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=786,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4095/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=786,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4096/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=786,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4097/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=786,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4098/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=786,816,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4099/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=787,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4100/500000]
+ optim/total_grad_norm=1.093
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=787,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4101/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=787,392,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=4102/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=787,584,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=4103/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=787,776,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=4104/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=787,968,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=4105/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=788,160,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=4106/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=788,352,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=4107/500000]
+ train/ActionNoiseL2Loss=0.1179
+ throughput/total_tokens=788,544,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=4108/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=788,736,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=4109/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=788,928,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=4110/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=789,120,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+ System/Peak GPU Memory (MB)=51,074
+[step=4111/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=789,312,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=4112/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=789,504,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=4113/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=789,696,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0475
+[step=4114/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=789,888,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=4115/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=790,080,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=4116/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=790,272,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=4117/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=790,464,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=4118/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=790,656,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=4119/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=790,848,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=4120/500000]
+ optim/total_grad_norm=2.612
+ train/ActionNoiseL2Loss=0.1303
+ throughput/total_tokens=791,040,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=4121/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=791,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4122/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=791,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4123/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=791,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4124/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=791,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4125/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=792,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4126/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=792,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4127/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=792,384,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4128/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=792,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4129/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=792,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4130/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=792,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4131/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=793,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4132/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=793,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4133/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=793,536,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4134/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=793,728,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4135/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=793,920,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4136/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=794,112,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4137/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=794,304,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4138/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=794,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4139/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=794,688,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4140/500000]
+ optim/total_grad_norm=1.235
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=794,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4141/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=795,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4142/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=795,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4143/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=795,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4144/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=795,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4145/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=795,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4146/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=796,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4147/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=796,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4148/500000]
+ train/ActionNoiseL2Loss=0.1234
+ throughput/total_tokens=796,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4149/500000]
+ train/ActionNoiseL2Loss=0.1029
+ throughput/total_tokens=796,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4150/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=796,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4151/500000]
+ train/ActionNoiseL2Loss=0.1335
+ throughput/total_tokens=796,992,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4152/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=797,184,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4153/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=797,376,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4154/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=797,568,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4155/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=797,760,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4156/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=797,952,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4157/500000]
+ train/ActionNoiseL2Loss=0.1268
+ throughput/total_tokens=798,144,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4158/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=798,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4159/500000]
+ train/ActionNoiseL2Loss=0.1223
+ throughput/total_tokens=798,528,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4160/500000]
+ optim/total_grad_norm=1.384
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=798,720,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=4161/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=798,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4162/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=799,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4163/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=799,296,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4164/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=799,488,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4165/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=799,680,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4166/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=799,872,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4167/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=800,064,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4168/500000]
+ train/ActionNoiseL2Loss=0.1243
+ throughput/total_tokens=800,256,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4169/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=800,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4170/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=800,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4171/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=800,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4172/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=801,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4173/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=801,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4174/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=801,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4175/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=801,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4176/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=801,792,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4177/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=801,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4178/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=802,176,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4179/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=802,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4180/500000]
+ optim/total_grad_norm=1.144
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=802,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4181/500000]
+ train/ActionNoiseL2Loss=0.0935
+ throughput/total_tokens=802,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4182/500000]
+ train/ActionNoiseL2Loss=0.1232
+ throughput/total_tokens=802,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4183/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=803,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4184/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=803,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4185/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=803,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4186/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=803,712,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4187/500000]
+ train/ActionNoiseL2Loss=0.1135
+ throughput/total_tokens=803,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4188/500000]
+ train/ActionNoiseL2Loss=0.1270
+ throughput/total_tokens=804,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4189/500000]
+ train/ActionNoiseL2Loss=0.1474
+ throughput/total_tokens=804,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4190/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=804,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4191/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=804,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4192/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=804,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4193/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=805,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4194/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=805,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4195/500000]
+ train/ActionNoiseL2Loss=0.1029
+ throughput/total_tokens=805,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4196/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=805,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4197/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=805,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4198/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=806,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4199/500000]
+ train/ActionNoiseL2Loss=0.1093
+ throughput/total_tokens=806,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4200/500000]
+ optim/total_grad_norm=1.484
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=806,400,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=4201/500000]
+ train/ActionNoiseL2Loss=0.1445
+ throughput/total_tokens=806,592,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4202/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=806,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4203/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=806,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4204/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=807,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4205/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=807,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4206/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=807,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4207/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=807,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4208/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=807,936,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4209/500000]
+ train/ActionNoiseL2Loss=0.1376
+ throughput/total_tokens=808,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4210/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=808,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=4211/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=808,512,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4212/500000]
+ train/ActionNoiseL2Loss=0.1515
+ throughput/total_tokens=808,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4213/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=808,896,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4214/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=809,088,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4215/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=809,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4216/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=809,472,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4217/500000]
+ train/ActionNoiseL2Loss=0.1166
+ throughput/total_tokens=809,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4218/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=809,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4219/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=810,048,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4220/500000]
+ optim/total_grad_norm=1.168
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=810,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4221/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=810,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4222/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=810,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4223/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=810,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4224/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=811,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4225/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=811,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4226/500000]
+ train/ActionNoiseL2Loss=0.1304
+ throughput/total_tokens=811,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4227/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=811,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4228/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=811,776,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4229/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=811,968,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4230/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=812,160,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4231/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=812,352,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4232/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=812,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4233/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=812,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4234/500000]
+ train/ActionNoiseL2Loss=0.1037
+ throughput/total_tokens=812,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4235/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=813,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4236/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=813,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4237/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=813,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4238/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=813,696,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4239/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=813,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4240/500000]
+ optim/total_grad_norm=1.436
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=814,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4241/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=814,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4242/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=814,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4243/500000]
+ train/ActionNoiseL2Loss=0.1615
+ throughput/total_tokens=814,656,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4244/500000]
+ train/ActionNoiseL2Loss=0.1066
+ throughput/total_tokens=814,848,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4245/500000]
+ train/ActionNoiseL2Loss=0.1036
+ throughput/total_tokens=815,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4246/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=815,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4247/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=815,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4248/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=815,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4249/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=815,808,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4250/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=816,000,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=4251/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=816,192,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4252/500000]
+ train/ActionNoiseL2Loss=0.1440
+ throughput/total_tokens=816,384,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4253/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=816,576,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4254/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=816,768,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4255/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=816,960,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4256/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=817,152,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4257/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=817,344,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4258/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=817,536,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4259/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=817,728,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4260/500000]
+ optim/total_grad_norm=0.9601
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=817,920,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=4261/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=818,112,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4262/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=818,304,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4263/500000]
+ train/ActionNoiseL2Loss=0.1162
+ throughput/total_tokens=818,496,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4264/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=818,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4265/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=818,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4266/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=819,072,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4267/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=819,264,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4268/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=819,456,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4269/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=819,648,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4270/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=819,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4271/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=820,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4272/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=820,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4273/500000]
+ train/ActionNoiseL2Loss=0.1169
+ throughput/total_tokens=820,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4274/500000]
+ train/ActionNoiseL2Loss=0.0956
+ throughput/total_tokens=820,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4275/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=820,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4276/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=820,992,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4277/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=821,184,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4278/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=821,376,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4279/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=821,568,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4280/500000]
+ optim/total_grad_norm=1.651
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=821,760,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4281/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=821,952,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4282/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=822,144,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4283/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=822,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4284/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=822,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4285/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=822,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4286/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=822,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4287/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=823,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4288/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=823,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4289/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=823,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4290/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=823,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4291/500000]
+ train/ActionNoiseL2Loss=0.1176
+ throughput/total_tokens=823,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4292/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=824,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4293/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=824,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4294/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=824,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4295/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=824,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4296/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=824,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4297/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=825,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4298/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=825,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4299/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=825,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4300/500000]
+ optim/total_grad_norm=1.324
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=825,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4301/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=825,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4302/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=825,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4303/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=826,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4304/500000]
+ train/ActionNoiseL2Loss=0.1159
+ throughput/total_tokens=826,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4305/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=826,560,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4306/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=826,752,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4307/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=826,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4308/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=827,136,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4309/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=827,328,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4310/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=827,520,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=4311/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=827,712,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4312/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=827,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4313/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=828,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4314/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=828,288,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4315/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=828,480,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4316/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=828,672,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4317/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=828,864,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4318/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=829,056,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4319/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=829,248,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4320/500000]
+ optim/total_grad_norm=1.118
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=829,440,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4321/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=829,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4322/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=829,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4323/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=830,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4324/500000]
+ train/ActionNoiseL2Loss=0.1233
+ throughput/total_tokens=830,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4325/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=830,400,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4326/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=830,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4327/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=830,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4328/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=830,976,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4329/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=831,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4330/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=831,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4331/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=831,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4332/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=831,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4333/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=831,936,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4334/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=832,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4335/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=832,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4336/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=832,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4337/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=832,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4338/500000]
+ train/ActionNoiseL2Loss=0.1344
+ throughput/total_tokens=832,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4339/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=833,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4340/500000]
+ optim/total_grad_norm=1.489
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=833,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4341/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=833,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4342/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=833,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4343/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=833,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4344/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=834,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4345/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=834,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4346/500000]
+ train/ActionNoiseL2Loss=0.1100
+ throughput/total_tokens=834,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4347/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=834,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4348/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=834,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4349/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=835,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4350/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=835,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4351/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=835,392,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=4352/500000]
+ train/ActionNoiseL2Loss=0.1162
+ throughput/total_tokens=835,584,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=4353/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=835,776,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=4354/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=835,968,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=4355/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=836,160,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=4356/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=836,352,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0475
+[step=4357/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=836,544,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=4358/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=836,736,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=4359/500000]
+ train/ActionNoiseL2Loss=0.1314
+ throughput/total_tokens=836,928,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=4360/500000]
+ optim/total_grad_norm=0.9375
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=837,120,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+ System/Peak GPU Memory (MB)=51,074
+[step=4361/500000]
+ train/ActionNoiseL2Loss=0.1189
+ throughput/total_tokens=837,312,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=4362/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=837,504,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0475
+[step=4363/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=837,696,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=4364/500000]
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=837,888,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=4365/500000]
+ train/ActionNoiseL2Loss=0.1607
+ throughput/total_tokens=838,080,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0475
+[step=4366/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=838,272,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0475
+[step=4367/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=838,464,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=4368/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=838,656,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=4369/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=838,848,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=4370/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=839,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4371/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=839,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4372/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=839,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4373/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=839,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4374/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=839,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4375/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=840,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4376/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=840,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4377/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=840,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4378/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=840,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4379/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=840,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4380/500000]
+ optim/total_grad_norm=1.157
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=840,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4381/500000]
+ train/ActionNoiseL2Loss=0.1361
+ throughput/total_tokens=841,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4382/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=841,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4383/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=841,536,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4384/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=841,728,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4385/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=841,920,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4386/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=842,112,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4387/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=842,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4388/500000]
+ train/ActionNoiseL2Loss=0.1126
+ throughput/total_tokens=842,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4389/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=842,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4390/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=842,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4391/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=843,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4392/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=843,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4393/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=843,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4394/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=843,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4395/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=843,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4396/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=844,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4397/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=844,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4398/500000]
+ train/ActionNoiseL2Loss=0.1137
+ throughput/total_tokens=844,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4399/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=844,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4400/500000]
+ optim/total_grad_norm=1.230
+ train/ActionNoiseL2Loss=0.1029
+ throughput/total_tokens=844,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=4401/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=844,992,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4402/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=845,184,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4403/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=845,376,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4404/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=845,568,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4405/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=845,760,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4406/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=845,952,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4407/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=846,144,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4408/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=846,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4409/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=846,528,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4410/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=846,720,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=4411/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=846,912,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4412/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=847,104,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4413/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=847,296,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4414/500000]
+ train/ActionNoiseL2Loss=0.1215
+ throughput/total_tokens=847,488,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4415/500000]
+ train/ActionNoiseL2Loss=0.1209
+ throughput/total_tokens=847,680,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4416/500000]
+ train/ActionNoiseL2Loss=0.1383
+ throughput/total_tokens=847,872,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4417/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=848,064,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4418/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=848,256,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4419/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=848,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4420/500000]
+ optim/total_grad_norm=1.064
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=848,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=4421/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=848,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4422/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=849,024,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4423/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=849,216,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4424/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=849,408,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4425/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=849,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4426/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=849,792,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4427/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=849,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4428/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=850,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4429/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=850,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4430/500000]
+ train/ActionNoiseL2Loss=0.1116
+ throughput/total_tokens=850,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4431/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=850,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4432/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=850,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4433/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=851,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4434/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=851,328,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4435/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=851,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4436/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=851,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4437/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=851,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4438/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=852,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4439/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=852,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4440/500000]
+ optim/total_grad_norm=1.805
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=852,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4441/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=852,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4442/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=852,864,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4443/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=853,056,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4444/500000]
+ train/ActionNoiseL2Loss=0.1285
+ throughput/total_tokens=853,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4445/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=853,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4446/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=853,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4447/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=853,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4448/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=854,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4449/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=854,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4450/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=854,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4451/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=854,592,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4452/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=854,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4453/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=854,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4454/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=855,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4455/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=855,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4456/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=855,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4457/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=855,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4458/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=855,936,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4459/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=856,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4460/500000]
+ optim/total_grad_norm=0.8077
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=856,320,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=4461/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=856,512,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4462/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=856,704,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4463/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=856,896,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4464/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=857,088,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4465/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=857,280,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4466/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=857,472,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4467/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=857,664,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4468/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=857,856,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4469/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=858,048,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4470/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=858,240,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4471/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=858,432,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4472/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=858,624,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4473/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=858,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4474/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=859,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4475/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=859,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4476/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=859,392,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4477/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=859,584,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4478/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=859,776,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4479/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=859,968,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4480/500000]
+ optim/total_grad_norm=0.7548
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=860,160,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4481/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=860,352,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4482/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=860,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4483/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=860,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4484/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=860,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4485/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=861,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4486/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=861,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4487/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=861,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4488/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=861,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4489/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=861,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4490/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=862,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4491/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=862,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4492/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=862,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4493/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=862,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4494/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=862,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4495/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=863,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4496/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=863,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4497/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=863,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4498/500000]
+ train/ActionNoiseL2Loss=0.1355
+ throughput/total_tokens=863,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4499/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=863,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4500/500000]
+ optim/total_grad_norm=0.9947
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=864,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+10/12 [19:25:49] INFO | >> Saving config... checkpoint.py:608
+10/12 [19:26:39] INFO | >> Saving model state... checkpoint.py:796
+10/12 [19:27:50] INFO | >> Saving optim state... checkpoint.py:811
+10/12 [19:29:22] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=4501/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=864,192,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=4502/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=864,384,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=4503/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=864,576,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=4504/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=864,768,000
+ throughput/device/tokens_per_second=1,126
+ throughput/device/batches_per_second=0.0469
+[step=4505/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=864,960,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=4506/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=865,152,000
+ throughput/device/tokens_per_second=1,135
+ throughput/device/batches_per_second=0.0473
+[step=4507/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=865,344,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=4508/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=865,536,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=4509/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=865,728,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=4510/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=865,920,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+ System/Peak GPU Memory (MB)=51,074
+[step=4511/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=866,112,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=4512/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=866,304,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=4513/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=866,496,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=4514/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=866,688,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=4515/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=866,880,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=4516/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=867,072,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=4517/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=867,264,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=4518/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=867,456,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=4519/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=867,648,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=4520/500000]
+ optim/total_grad_norm=0.7646
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=867,840,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=4521/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=868,032,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4522/500000]
+ train/ActionNoiseL2Loss=0.1137
+ throughput/total_tokens=868,224,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4523/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=868,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4524/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=868,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4525/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=868,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4526/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=868,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4527/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=869,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4528/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=869,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4529/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=869,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4530/500000]
+ train/ActionNoiseL2Loss=0.0967
+ throughput/total_tokens=869,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4531/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=869,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4532/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=870,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4533/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=870,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4534/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=870,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4535/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=870,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4536/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=870,912,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4537/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=871,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4538/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=871,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4539/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=871,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4540/500000]
+ optim/total_grad_norm=0.9561
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=871,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4541/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=871,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4542/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=872,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4543/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=872,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4544/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=872,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4545/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=872,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4546/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=872,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4547/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=873,024,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4548/500000]
+ train/ActionNoiseL2Loss=0.1245
+ throughput/total_tokens=873,216,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4549/500000]
+ train/ActionNoiseL2Loss=0.1079
+ throughput/total_tokens=873,408,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4550/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=873,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=4551/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=873,792,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4552/500000]
+ train/ActionNoiseL2Loss=0.1448
+ throughput/total_tokens=873,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4553/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=874,176,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4554/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=874,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4555/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=874,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4556/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=874,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4557/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=874,944,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4558/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=875,136,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4559/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=875,328,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4560/500000]
+ optim/total_grad_norm=1.641
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=875,520,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=4561/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=875,712,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4562/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=875,904,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4563/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=876,096,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4564/500000]
+ train/ActionNoiseL2Loss=0.1629
+ throughput/total_tokens=876,288,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4565/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=876,480,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4566/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=876,672,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4567/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=876,864,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4568/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=877,056,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4569/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=877,248,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4570/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=877,440,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4571/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=877,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4572/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=877,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4573/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=878,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4574/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=878,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4575/500000]
+ train/ActionNoiseL2Loss=0.1137
+ throughput/total_tokens=878,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4576/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=878,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4577/500000]
+ train/ActionNoiseL2Loss=0.0246
+ throughput/total_tokens=878,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4578/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=878,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4579/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=879,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4580/500000]
+ optim/total_grad_norm=0.7975
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=879,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4581/500000]
+ train/ActionNoiseL2Loss=0.1091
+ throughput/total_tokens=879,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4582/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=879,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4583/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=879,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4584/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=880,128,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4585/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=880,320,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4586/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=880,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4587/500000]
+ train/ActionNoiseL2Loss=0.1519
+ throughput/total_tokens=880,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4588/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=880,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4589/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=881,088,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4590/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=881,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4591/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=881,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4592/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=881,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4593/500000]
+ train/ActionNoiseL2Loss=0.1161
+ throughput/total_tokens=881,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4594/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=882,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4595/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=882,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4596/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=882,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4597/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=882,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4598/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=882,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4599/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=883,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4600/500000]
+ optim/total_grad_norm=0.5985
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=883,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=4601/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=883,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4602/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=883,584,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4603/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=883,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4604/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=883,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4605/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=884,160,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4606/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=884,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4607/500000]
+ train/ActionNoiseL2Loss=0.0235
+ throughput/total_tokens=884,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4608/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=884,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4609/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=884,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4610/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=885,120,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=4611/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=885,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4612/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=885,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4613/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=885,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4614/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=885,888,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4615/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=886,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4616/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=886,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4617/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=886,464,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4618/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=886,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4619/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=886,848,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4620/500000]
+ optim/total_grad_norm=0.9250
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=887,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4621/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=887,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4622/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=887,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4623/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=887,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4624/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=887,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4625/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=888,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4626/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=888,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4627/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=888,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4628/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=888,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4629/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=888,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4630/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=888,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4631/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=889,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4632/500000]
+ train/ActionNoiseL2Loss=0.1121
+ throughput/total_tokens=889,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4633/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=889,536,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4634/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=889,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4635/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=889,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4636/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=890,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4637/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=890,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4638/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=890,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4639/500000]
+ train/ActionNoiseL2Loss=0.1241
+ throughput/total_tokens=890,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4640/500000]
+ optim/total_grad_norm=0.9694
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=890,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4641/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=891,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4642/500000]
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=891,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4643/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=891,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4644/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=891,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4645/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=891,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4646/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=892,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4647/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=892,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4648/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=892,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4649/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=892,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4650/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=892,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4651/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=892,992,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4652/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=893,184,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4653/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=893,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4654/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=893,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4655/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=893,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4656/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=893,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4657/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=894,144,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4658/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=894,336,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4659/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=894,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4660/500000]
+ optim/total_grad_norm=1.121
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=894,720,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=4661/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=894,912,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=4662/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=895,104,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4663/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=895,296,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4664/500000]
+ train/ActionNoiseL2Loss=0.1380
+ throughput/total_tokens=895,488,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4665/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=895,680,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4666/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=895,872,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4667/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=896,064,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4668/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=896,256,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4669/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=896,448,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4670/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=896,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4671/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=896,832,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4672/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=897,024,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4673/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=897,216,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4674/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=897,408,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4675/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=897,600,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4676/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=897,792,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4677/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=897,984,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4678/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=898,176,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4679/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=898,368,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4680/500000]
+ optim/total_grad_norm=0.9191
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=898,560,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=4681/500000]
+ train/ActionNoiseL2Loss=0.1173
+ throughput/total_tokens=898,752,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4682/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=898,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4683/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=899,136,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4684/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=899,328,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4685/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=899,520,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4686/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=899,712,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4687/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=899,904,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4688/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=900,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4689/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=900,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4690/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=900,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4691/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=900,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4692/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=900,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4693/500000]
+ train/ActionNoiseL2Loss=0.1079
+ throughput/total_tokens=901,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4694/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=901,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4695/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=901,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4696/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=901,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4697/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=901,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4698/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=902,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4699/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=902,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4700/500000]
+ optim/total_grad_norm=1.303
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=902,400,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=4701/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=902,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4702/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=902,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4703/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=902,976,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4704/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=903,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4705/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=903,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4706/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=903,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4707/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=903,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4708/500000]
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=903,936,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4709/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=904,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4710/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=904,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=4711/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=904,512,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4712/500000]
+ train/ActionNoiseL2Loss=0.1092
+ throughput/total_tokens=904,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4713/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=904,896,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4714/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=905,088,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4715/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=905,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4716/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=905,472,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4717/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=905,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4718/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=905,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4719/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=906,048,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4720/500000]
+ optim/total_grad_norm=1.419
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=906,240,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4721/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=906,432,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4722/500000]
+ train/ActionNoiseL2Loss=0.1582
+ throughput/total_tokens=906,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4723/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=906,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4724/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=907,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4725/500000]
+ train/ActionNoiseL2Loss=0.1336
+ throughput/total_tokens=907,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4726/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=907,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4727/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=907,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4728/500000]
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=907,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4729/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=907,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4730/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=908,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4731/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=908,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4732/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=908,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4733/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=908,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4734/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=908,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4735/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=909,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4736/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=909,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4737/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=909,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4738/500000]
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=909,696,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4739/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=909,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4740/500000]
+ optim/total_grad_norm=0.6037
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=910,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4741/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=910,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4742/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=910,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4743/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=910,656,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4744/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=910,848,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4745/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=911,040,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4746/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=911,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4747/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=911,424,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4748/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=911,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4749/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=911,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4750/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=912,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4751/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=912,192,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4752/500000]
+ train/ActionNoiseL2Loss=0.1080
+ throughput/total_tokens=912,384,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4753/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=912,576,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4754/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=912,768,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4755/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=912,960,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4756/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=913,152,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4757/500000]
+ train/ActionNoiseL2Loss=0.1146
+ throughput/total_tokens=913,344,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4758/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=913,536,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4759/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=913,728,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4760/500000]
+ optim/total_grad_norm=1.407
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=913,920,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=4761/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=914,112,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4762/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=914,304,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4763/500000]
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=914,496,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4764/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=914,688,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4765/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=914,880,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4766/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=915,072,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4767/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=915,264,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4768/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=915,456,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4769/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=915,648,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4770/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=915,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4771/500000]
+ train/ActionNoiseL2Loss=0.1116
+ throughput/total_tokens=916,032,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4772/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=916,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4773/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=916,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4774/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=916,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4775/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=916,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4776/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=916,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4777/500000]
+ train/ActionNoiseL2Loss=0.1216
+ throughput/total_tokens=917,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4778/500000]
+ train/ActionNoiseL2Loss=0.1215
+ throughput/total_tokens=917,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4779/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=917,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4780/500000]
+ optim/total_grad_norm=1.536
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=917,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=4781/500000]
+ train/ActionNoiseL2Loss=0.1365
+ throughput/total_tokens=917,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4782/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=918,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4783/500000]
+ train/ActionNoiseL2Loss=0.1250
+ throughput/total_tokens=918,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4784/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=918,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4785/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=918,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4786/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=918,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4787/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=919,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4788/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=919,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4789/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=919,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4790/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=919,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4791/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=919,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4792/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=920,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4793/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=920,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4794/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=920,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4795/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=920,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4796/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=920,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4797/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=921,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4798/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=921,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4799/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=921,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4800/500000]
+ optim/total_grad_norm=1.393
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=921,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4801/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=921,792,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4802/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=921,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4803/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=922,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4804/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=922,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4805/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=922,560,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4806/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=922,752,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4807/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=922,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4808/500000]
+ train/ActionNoiseL2Loss=0.1066
+ throughput/total_tokens=923,136,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4809/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=923,328,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4810/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=923,520,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=4811/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=923,712,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4812/500000]
+ train/ActionNoiseL2Loss=0.1159
+ throughput/total_tokens=923,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4813/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=924,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4814/500000]
+ train/ActionNoiseL2Loss=0.1364
+ throughput/total_tokens=924,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4815/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=924,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4816/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=924,672,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=4817/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=924,864,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=4818/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=925,056,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=4819/500000]
+ train/ActionNoiseL2Loss=0.1153
+ throughput/total_tokens=925,248,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=4820/500000]
+ optim/total_grad_norm=1.458
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=925,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4821/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=925,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4822/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=925,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4823/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=926,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4824/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=926,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4825/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=926,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4826/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=926,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4827/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=926,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4828/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=926,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4829/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=927,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4830/500000]
+ train/ActionNoiseL2Loss=0.1541
+ throughput/total_tokens=927,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4831/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=927,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4832/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=927,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4833/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=927,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4834/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=928,128,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4835/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=928,320,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4836/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=928,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4837/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=928,704,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4838/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=928,896,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4839/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=929,088,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4840/500000]
+ optim/total_grad_norm=0.8004
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=929,280,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4841/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=929,472,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4842/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=929,664,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4843/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=929,856,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4844/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=930,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4845/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=930,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4846/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=930,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4847/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=930,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4848/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=930,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4849/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=931,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4850/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=931,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4851/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=931,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4852/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=931,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4853/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=931,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4854/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=931,968,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4855/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=932,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4856/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=932,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4857/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=932,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=4858/500000]
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=932,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4859/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=932,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4860/500000]
+ optim/total_grad_norm=2.659
+ train/ActionNoiseL2Loss=0.1654
+ throughput/total_tokens=933,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=4861/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=933,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4862/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=933,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4863/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=933,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4864/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=933,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4865/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=934,080,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=4866/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=934,272,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=4867/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=934,464,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=4868/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=934,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4869/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=934,848,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=4870/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=935,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4871/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=935,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4872/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=935,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4873/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=935,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4874/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=935,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4875/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=936,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4876/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=936,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4877/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=936,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4878/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=936,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4879/500000]
+ train/ActionNoiseL2Loss=0.1213
+ throughput/total_tokens=936,768,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4880/500000]
+ optim/total_grad_norm=0.7417
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=936,960,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4881/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=937,152,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4882/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=937,344,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=4883/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=937,536,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4884/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=937,728,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4885/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=937,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4886/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=938,112,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4887/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=938,304,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4888/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=938,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4889/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=938,688,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4890/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=938,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4891/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=939,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4892/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=939,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4893/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=939,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4894/500000]
+ train/ActionNoiseL2Loss=0.1420
+ throughput/total_tokens=939,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4895/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=939,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4896/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=940,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4897/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=940,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4898/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=940,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4899/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=940,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4900/500000]
+ optim/total_grad_norm=0.9992
+ train/ActionNoiseL2Loss=0.1182
+ throughput/total_tokens=940,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4901/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=940,992,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4902/500000]
+ train/ActionNoiseL2Loss=0.0966
+ throughput/total_tokens=941,184,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4903/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=941,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4904/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=941,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4905/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=941,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4906/500000]
+ train/ActionNoiseL2Loss=0.1083
+ throughput/total_tokens=941,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4907/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=942,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4908/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=942,336,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4909/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=942,528,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4910/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=942,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=4911/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=942,912,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4912/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=943,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4913/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=943,296,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4914/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=943,488,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4915/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=943,680,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4916/500000]
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=943,872,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4917/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=944,064,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4918/500000]
+ train/ActionNoiseL2Loss=0.1139
+ throughput/total_tokens=944,256,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4919/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=944,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4920/500000]
+ optim/total_grad_norm=1.357
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=944,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4921/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=944,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4922/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=945,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4923/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=945,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4924/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=945,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4925/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=945,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4926/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=945,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4927/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=945,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4928/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=946,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4929/500000]
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=946,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4930/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=946,560,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4931/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=946,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4932/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=946,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4933/500000]
+ train/ActionNoiseL2Loss=0.1275
+ throughput/total_tokens=947,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4934/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=947,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4935/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=947,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4936/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=947,712,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4937/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=947,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4938/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=948,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4939/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=948,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4940/500000]
+ optim/total_grad_norm=1.075
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=948,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=4941/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=948,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4942/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=948,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4943/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=949,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4944/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=949,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4945/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=949,440,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4946/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=949,632,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4947/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=949,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4948/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=950,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4949/500000]
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=950,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4950/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=950,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4951/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=950,592,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4952/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=950,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4953/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=950,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4954/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=951,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4955/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=951,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4956/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=951,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4957/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=951,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4958/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=951,936,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4959/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=952,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4960/500000]
+ optim/total_grad_norm=1.582
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=952,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=4961/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=952,512,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4962/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=952,704,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4963/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=952,896,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4964/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=953,088,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4965/500000]
+ train/ActionNoiseL2Loss=0.1160
+ throughput/total_tokens=953,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=4966/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=953,472,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4967/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=953,664,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4968/500000]
+ train/ActionNoiseL2Loss=0.1140
+ throughput/total_tokens=953,856,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4969/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=954,048,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=4970/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=954,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=4971/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=954,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4972/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=954,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4973/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=954,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4974/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=955,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4975/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=955,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4976/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=955,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4977/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=955,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=4978/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=955,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4979/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=955,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4980/500000]
+ optim/total_grad_norm=1.384
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=956,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4981/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=956,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4982/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=956,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4983/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=956,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=4984/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=956,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4985/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=957,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4986/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=957,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4987/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=957,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4988/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=957,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4989/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=957,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4990/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=958,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=4991/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=958,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4992/500000]
+ train/ActionNoiseL2Loss=0.1061
+ throughput/total_tokens=958,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4993/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=958,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4994/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=958,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4995/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=959,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=4996/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=959,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4997/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=959,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4998/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=959,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=4999/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=959,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5000/500000]
+ optim/total_grad_norm=1.546
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=960,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+10/12 [22:24:31] INFO | >> Saving config... checkpoint.py:608
+10/12 [22:25:19] INFO | >> Saving model state... checkpoint.py:796
+10/12 [22:26:32] INFO | >> Saving optim state... checkpoint.py:811
+10/12 [22:28:04] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=5001/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=960,192,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=5002/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=960,384,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=5003/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=960,576,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=5004/500000]
+ train/ActionNoiseL2Loss=0.1037
+ throughput/total_tokens=960,768,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=5005/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=960,960,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=5006/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=961,152,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=5007/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=961,344,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=5008/500000]
+ train/ActionNoiseL2Loss=0.1515
+ throughput/total_tokens=961,536,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=5009/500000]
+ train/ActionNoiseL2Loss=0.1026
+ throughput/total_tokens=961,728,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=5010/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=961,920,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+ System/Peak GPU Memory (MB)=51,074
+[step=5011/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=962,112,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5012/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=962,304,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5013/500000]
+ train/ActionNoiseL2Loss=0.1264
+ throughput/total_tokens=962,496,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5014/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=962,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5015/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=962,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5016/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=963,072,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5017/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=963,264,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5018/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=963,456,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5019/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=963,648,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5020/500000]
+ optim/total_grad_norm=0.8876
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=963,840,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=5021/500000]
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=964,032,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5022/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=964,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5023/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=964,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5024/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=964,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5025/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=964,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5026/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=964,992,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5027/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=965,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5028/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=965,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5029/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=965,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5030/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=965,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5031/500000]
+ train/ActionNoiseL2Loss=0.1012
+ throughput/total_tokens=965,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5032/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=966,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5033/500000]
+ train/ActionNoiseL2Loss=0.0996
+ throughput/total_tokens=966,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5034/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=966,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5035/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=966,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5036/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=966,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5037/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=967,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5038/500000]
+ train/ActionNoiseL2Loss=0.1084
+ throughput/total_tokens=967,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5039/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=967,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5040/500000]
+ optim/total_grad_norm=0.8980
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=967,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=5041/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=967,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5042/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=968,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5043/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=968,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5044/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=968,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5045/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=968,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5046/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=968,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5047/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=969,024,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5048/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=969,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5049/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=969,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5050/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=969,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5051/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=969,792,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5052/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=969,984,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5053/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=970,176,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5054/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=970,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5055/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=970,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5056/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=970,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5057/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=970,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5058/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=971,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5059/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=971,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5060/500000]
+ optim/total_grad_norm=0.9589
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=971,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5061/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=971,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5062/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=971,904,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5063/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=972,096,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5064/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=972,288,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5065/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=972,480,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5066/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=972,672,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5067/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=972,864,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5068/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=973,056,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5069/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=973,248,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5070/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=973,440,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=5071/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=973,632,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5072/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=973,824,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5073/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=974,016,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5074/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=974,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5075/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=974,400,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5076/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=974,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5077/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=974,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5078/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=974,976,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5079/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=975,168,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5080/500000]
+ optim/total_grad_norm=1.082
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=975,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=5081/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=975,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5082/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=975,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5083/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=975,936,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5084/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=976,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5085/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=976,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5086/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=976,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5087/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=976,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5088/500000]
+ train/ActionNoiseL2Loss=0.1109
+ throughput/total_tokens=976,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5089/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=977,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5090/500000]
+ train/ActionNoiseL2Loss=0.1053
+ throughput/total_tokens=977,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5091/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=977,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5092/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=977,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5093/500000]
+ train/ActionNoiseL2Loss=0.1453
+ throughput/total_tokens=977,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5094/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=978,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5095/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=978,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5096/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=978,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5097/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=978,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5098/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=978,816,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5099/500000]
+ train/ActionNoiseL2Loss=0.0897
+ throughput/total_tokens=979,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5100/500000]
+ optim/total_grad_norm=1.181
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=979,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5101/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=979,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5102/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=979,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5103/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=979,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5104/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=979,968,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5105/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=980,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5106/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=980,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5107/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=980,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5108/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=980,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5109/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=980,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5110/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=981,120,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=5111/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=981,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5112/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=981,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5113/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=981,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5114/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=981,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5115/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=982,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5116/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=982,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5117/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=982,464,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5118/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=982,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5119/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=982,848,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5120/500000]
+ optim/total_grad_norm=0.5962
+ train/ActionNoiseL2Loss=0.0258
+ throughput/total_tokens=983,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5121/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=983,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5122/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=983,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5123/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=983,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5124/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=983,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5125/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=984,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5126/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=984,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5127/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=984,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5128/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=984,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5129/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=984,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5130/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=984,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5131/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=985,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5132/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=985,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5133/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=985,536,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5134/500000]
+ train/ActionNoiseL2Loss=0.1222
+ throughput/total_tokens=985,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5135/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=985,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5136/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=986,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5137/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=986,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5138/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=986,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5139/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=986,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5140/500000]
+ optim/total_grad_norm=1.031
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=986,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5141/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=987,072,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5142/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=987,264,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5143/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=987,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5144/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=987,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5145/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=987,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5146/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=988,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5147/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=988,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5148/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=988,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5149/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=988,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5150/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=988,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5151/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=988,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5152/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=989,184,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5153/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=989,376,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5154/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=989,568,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5155/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=989,760,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5156/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=989,952,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5157/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=990,144,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5158/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=990,336,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5159/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=990,528,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5160/500000]
+ optim/total_grad_norm=1.061
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=990,720,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=5161/500000]
+ train/ActionNoiseL2Loss=0.1019
+ throughput/total_tokens=990,912,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5162/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=991,104,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5163/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=991,296,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5164/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=991,488,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5165/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=991,680,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5166/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=991,872,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5167/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=992,064,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5168/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=992,256,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5169/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=992,448,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5170/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=992,640,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5171/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=992,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5172/500000]
+ train/ActionNoiseL2Loss=0.1105
+ throughput/total_tokens=993,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5173/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=993,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5174/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=993,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5175/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=993,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5176/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=993,792,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5177/500000]
+ train/ActionNoiseL2Loss=0.1089
+ throughput/total_tokens=993,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5178/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=994,176,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5179/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=994,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5180/500000]
+ optim/total_grad_norm=1.213
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=994,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5181/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=994,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5182/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=994,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5183/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=995,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5184/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=995,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5185/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=995,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5186/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=995,712,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5187/500000]
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=995,904,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5188/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=996,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5189/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=996,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5190/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=996,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5191/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=996,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5192/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=996,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5193/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=997,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5194/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=997,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5195/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=997,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5196/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=997,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5197/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=997,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5198/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=998,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5199/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=998,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5200/500000]
+ optim/total_grad_norm=0.8683
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=998,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5201/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=998,592,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5202/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=998,784,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5203/500000]
+ train/ActionNoiseL2Loss=0.1073
+ throughput/total_tokens=998,976,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5204/500000]
+ train/ActionNoiseL2Loss=0.1486
+ throughput/total_tokens=999,168,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5205/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=999,360,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5206/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=999,552,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5207/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=999,744,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5208/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=999,936,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5209/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=1,000,128,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5210/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=1,000,320,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=5211/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,000,512,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5212/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=1,000,704,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5213/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=1,000,896,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5214/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,001,088,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5215/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,001,280,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5216/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=1,001,472,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5217/500000]
+ train/ActionNoiseL2Loss=0.1263
+ throughput/total_tokens=1,001,664,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5218/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,001,856,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5219/500000]
+ train/ActionNoiseL2Loss=0.1451
+ throughput/total_tokens=1,002,048,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5220/500000]
+ optim/total_grad_norm=0.9051
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,002,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5221/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=1,002,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5222/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,002,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5223/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=1,002,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5224/500000]
+ train/ActionNoiseL2Loss=0.0976
+ throughput/total_tokens=1,003,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5225/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=1,003,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5226/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=1,003,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5227/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,003,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5228/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=1,003,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5229/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,003,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5230/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,004,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=5231/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=1,004,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5232/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=1,004,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5233/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,004,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5234/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,004,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5235/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=1,005,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5236/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,005,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5237/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,005,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5238/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=1,005,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5239/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,005,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5240/500000]
+ optim/total_grad_norm=1.300
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=1,006,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5241/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=1,006,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5242/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,006,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5243/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=1,006,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5244/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=1,006,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5245/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,007,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5246/500000]
+ train/ActionNoiseL2Loss=0.0897
+ throughput/total_tokens=1,007,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5247/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,007,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5248/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=1,007,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5249/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,007,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5250/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,008,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5251/500000]
+ train/ActionNoiseL2Loss=0.1460
+ throughput/total_tokens=1,008,192,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5252/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,008,384,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5253/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,008,576,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5254/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,008,768,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5255/500000]
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=1,008,960,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5256/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=1,009,152,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5257/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,009,344,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5258/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,009,536,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5259/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=1,009,728,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5260/500000]
+ optim/total_grad_norm=0.9496
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,009,920,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5261/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,010,112,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5262/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,010,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5263/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=1,010,496,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5264/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,010,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5265/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=1,010,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5266/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,011,072,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5267/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,011,264,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5268/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,011,456,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5269/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,011,648,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5270/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,011,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5271/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,012,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5272/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,012,224,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=5273/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,012,416,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=5274/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,012,608,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=5275/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=1,012,800,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5276/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,012,992,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5277/500000]
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=1,013,184,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5278/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=1,013,376,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5279/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,013,568,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5280/500000]
+ optim/total_grad_norm=0.9763
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,013,760,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5281/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,013,952,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5282/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,014,144,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5283/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,014,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5284/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=1,014,528,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5285/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=1,014,720,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5286/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=1,014,912,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5287/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,015,104,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5288/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,015,296,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5289/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=1,015,488,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=5290/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,015,680,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5291/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,015,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5292/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,016,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5293/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,016,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5294/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=1,016,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5295/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,016,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5296/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,016,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5297/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,017,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5298/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,017,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5299/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,017,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5300/500000]
+ optim/total_grad_norm=0.9655
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,017,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5301/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=1,017,792,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=5302/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=1,017,984,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=5303/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,018,176,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=5304/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,018,368,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=5305/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,018,560,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=5306/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,018,752,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=5307/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=1,018,944,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=5308/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=1,019,136,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=5309/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,019,328,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=5310/500000]
+ train/ActionNoiseL2Loss=0.1790
+ throughput/total_tokens=1,019,520,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+ System/Peak GPU Memory (MB)=51,074
+[step=5311/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,019,712,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=5312/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,019,904,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=5313/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,020,096,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=5314/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,020,288,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=5315/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,020,480,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=5316/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,020,672,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=5317/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=1,020,864,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=5318/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,021,056,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=5319/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,021,248,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=5320/500000]
+ optim/total_grad_norm=0.9204
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,021,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5321/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,021,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5322/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,021,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5323/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,022,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5324/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,022,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5325/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,022,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5326/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=1,022,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5327/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,022,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5328/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,022,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5329/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,023,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5330/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,023,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5331/500000]
+ train/ActionNoiseL2Loss=0.1015
+ throughput/total_tokens=1,023,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5332/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=1,023,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5333/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,023,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5334/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=1,024,128,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5335/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,024,320,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5336/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,024,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5337/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,024,704,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5338/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,024,896,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5339/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,025,088,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5340/500000]
+ optim/total_grad_norm=0.6405
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=1,025,280,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5341/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,025,472,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5342/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=1,025,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5343/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,025,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5344/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=1,026,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5345/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,026,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5346/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=1,026,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5347/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,026,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5348/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,026,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5349/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,027,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5350/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,027,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5351/500000]
+ train/ActionNoiseL2Loss=0.1460
+ throughput/total_tokens=1,027,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5352/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,027,584,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5353/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=1,027,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5354/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=1,027,968,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5355/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=1,028,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5356/500000]
+ train/ActionNoiseL2Loss=0.0897
+ throughput/total_tokens=1,028,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5357/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,028,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5358/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,028,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5359/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,028,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5360/500000]
+ optim/total_grad_norm=1.173
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,029,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5361/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=1,029,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5362/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,029,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5363/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,029,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5364/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=1,029,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5365/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,030,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5366/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,030,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5367/500000]
+ train/ActionNoiseL2Loss=0.0959
+ throughput/total_tokens=1,030,464,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5368/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,030,656,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5369/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,030,848,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5370/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,031,040,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5371/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,031,232,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5372/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,031,424,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5373/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,031,616,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5374/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=1,031,808,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5375/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=1,032,000,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5376/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,032,192,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5377/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=1,032,384,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5378/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,032,576,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5379/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,032,768,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=5380/500000]
+ optim/total_grad_norm=0.9792
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=1,032,960,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5381/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,033,152,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5382/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,033,344,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5383/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=1,033,536,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5384/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=1,033,728,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5385/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=1,033,920,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5386/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=1,034,112,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5387/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,034,304,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5388/500000]
+ train/ActionNoiseL2Loss=0.1529
+ throughput/total_tokens=1,034,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5389/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=1,034,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5390/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=1,034,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5391/500000]
+ train/ActionNoiseL2Loss=0.1247
+ throughput/total_tokens=1,035,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5392/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,035,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5393/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,035,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5394/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,035,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5395/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,035,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5396/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=1,036,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5397/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=1,036,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5398/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,036,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5399/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=1,036,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5400/500000]
+ optim/total_grad_norm=1.342
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=1,036,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5401/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,036,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5402/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,037,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5403/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,037,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5404/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=1,037,568,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5405/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,037,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5406/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,037,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5407/500000]
+ train/ActionNoiseL2Loss=0.1343
+ throughput/total_tokens=1,038,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5408/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,038,336,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5409/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,038,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5410/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=1,038,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5411/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,038,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5412/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=1,039,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5413/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,039,296,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5414/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=1,039,488,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5415/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=1,039,680,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5416/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=1,039,872,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5417/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,040,064,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5418/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,040,256,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5419/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,040,448,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5420/500000]
+ optim/total_grad_norm=0.7032
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,040,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=5421/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=1,040,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5422/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,041,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5423/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,041,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5424/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=1,041,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5425/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=1,041,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5426/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,041,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5427/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=1,041,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5428/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=1,042,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5429/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,042,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5430/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,042,560,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5431/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,042,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5432/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,042,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5433/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,043,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5434/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,043,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5435/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,043,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5436/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,043,712,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5437/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,043,904,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5438/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,044,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5439/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,044,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5440/500000]
+ optim/total_grad_norm=0.9870
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,044,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5441/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=1,044,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5442/500000]
+ train/ActionNoiseL2Loss=0.1222
+ throughput/total_tokens=1,044,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5443/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=1,045,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5444/500000]
+ train/ActionNoiseL2Loss=0.1716
+ throughput/total_tokens=1,045,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5445/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=1,045,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5446/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,045,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5447/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=1,045,824,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=5448/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,046,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5449/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,046,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5450/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,046,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5451/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,046,592,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5452/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,046,784,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5453/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,046,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5454/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,047,168,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5455/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,047,360,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5456/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=1,047,552,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5457/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,047,744,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5458/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,047,936,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5459/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=1,048,128,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5460/500000]
+ optim/total_grad_norm=0.8195
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=1,048,320,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5461/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,048,512,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5462/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=1,048,704,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5463/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=1,048,896,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5464/500000]
+ train/ActionNoiseL2Loss=0.1000
+ throughput/total_tokens=1,049,088,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5465/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,049,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5466/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,049,472,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5467/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,049,664,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5468/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,049,856,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5469/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,050,048,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5470/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,050,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=5471/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,050,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5472/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,050,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5473/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=1,050,816,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5474/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,051,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5475/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,051,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5476/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=1,051,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5477/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,051,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5478/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,051,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5479/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=1,051,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5480/500000]
+ optim/total_grad_norm=1.049
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=1,052,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=5481/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,052,352,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5482/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,052,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5483/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=1,052,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5484/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=1,052,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5485/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,053,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5486/500000]
+ train/ActionNoiseL2Loss=0.1325
+ throughput/total_tokens=1,053,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5487/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=1,053,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5488/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,053,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5489/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,053,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5490/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,054,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5491/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=1,054,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5492/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,054,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5493/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=1,054,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5494/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,054,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5495/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,055,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5496/500000]
+ train/ActionNoiseL2Loss=0.1416
+ throughput/total_tokens=1,055,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5497/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=1,055,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5498/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=1,055,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5499/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=1,055,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5500/500000]
+ optim/total_grad_norm=1.142
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=1,056,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+10/13 [01:23:24] INFO | >> Saving config... checkpoint.py:608
+10/13 [01:24:06] INFO | >> Saving model state... checkpoint.py:796
+10/13 [01:25:15] INFO | >> Saving optim state... checkpoint.py:811
+10/13 [01:26:47] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=5501/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=1,056,192,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5502/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=1,056,384,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=5503/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,056,576,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=5504/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,056,768,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5505/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=1,056,960,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5506/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,057,152,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5507/500000]
+ train/ActionNoiseL2Loss=0.1097
+ throughput/total_tokens=1,057,344,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5508/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,057,536,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5509/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,057,728,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5510/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=1,057,920,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5511/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,058,112,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5512/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,058,304,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5513/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,058,496,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5514/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=1,058,688,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=5515/500000]
+ train/ActionNoiseL2Loss=0.1261
+ throughput/total_tokens=1,058,880,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5516/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,059,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5517/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,059,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5518/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=1,059,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5519/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=1,059,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5520/500000]
+ optim/total_grad_norm=1.163
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,059,840,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5521/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,060,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5522/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=1,060,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5523/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,060,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5524/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,060,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5525/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,060,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5526/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=1,060,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5527/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=1,061,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5528/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,061,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5529/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=1,061,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5530/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,061,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5531/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,061,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5532/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,062,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5533/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=1,062,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5534/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,062,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5535/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=1,062,720,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5536/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,062,912,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5537/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,063,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5538/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,063,296,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5539/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,063,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5540/500000]
+ optim/total_grad_norm=1.081
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=1,063,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5541/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,063,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5542/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=1,064,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5543/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,064,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5544/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,064,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5545/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=1,064,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5546/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=1,064,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5547/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=1,065,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5548/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=1,065,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5549/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,065,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5550/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=1,065,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5551/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,065,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5552/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,065,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5553/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,066,176,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5554/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,066,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5555/500000]
+ train/ActionNoiseL2Loss=0.1592
+ throughput/total_tokens=1,066,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5556/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,066,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5557/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=1,066,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5558/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,067,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5559/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,067,328,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5560/500000]
+ optim/total_grad_norm=0.9835
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,067,520,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5561/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,067,712,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5562/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,067,904,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5563/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,068,096,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5564/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,068,288,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5565/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,068,480,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5566/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,068,672,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5567/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=1,068,864,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5568/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,069,056,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5569/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=1,069,248,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5570/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,069,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5571/500000]
+ train/ActionNoiseL2Loss=0.1201
+ throughput/total_tokens=1,069,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5572/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,069,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5573/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,070,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5574/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,070,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5575/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=1,070,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5576/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=1,070,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5577/500000]
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=1,070,784,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5578/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=1,070,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5579/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=1,071,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5580/500000]
+ optim/total_grad_norm=1.336
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,071,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=5581/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=1,071,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5582/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,071,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5583/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=1,071,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5584/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=1,072,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5585/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=1,072,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5586/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,072,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5587/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,072,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5588/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,072,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5589/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=1,073,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5590/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=1,073,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5591/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,073,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5592/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=1,073,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5593/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=1,073,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5594/500000]
+ train/ActionNoiseL2Loss=0.1201
+ throughput/total_tokens=1,074,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5595/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=1,074,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5596/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,074,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5597/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,074,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5598/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,074,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5599/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,075,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5600/500000]
+ optim/total_grad_norm=1.308
+ train/ActionNoiseL2Loss=0.1189
+ throughput/total_tokens=1,075,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5601/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=1,075,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5602/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=1,075,584,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5603/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,075,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5604/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=1,075,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5605/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,076,160,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5606/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=1,076,352,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5607/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=1,076,544,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5608/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,076,736,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5609/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,076,928,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5610/500000]
+ train/ActionNoiseL2Loss=0.1635
+ throughput/total_tokens=1,077,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5611/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=1,077,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5612/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,077,504,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5613/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,077,696,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5614/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,077,888,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5615/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,078,080,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5616/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=1,078,272,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5617/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,078,464,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5618/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,078,656,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5619/500000]
+ train/ActionNoiseL2Loss=0.1119
+ throughput/total_tokens=1,078,848,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5620/500000]
+ optim/total_grad_norm=0.9786
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=1,079,040,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5621/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,079,232,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5622/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,079,424,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5623/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,079,616,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5624/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,079,808,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5625/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,080,000,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5626/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,080,192,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5627/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=1,080,384,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5628/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,080,576,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5629/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=1,080,768,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5630/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,080,960,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5631/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,081,152,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5632/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,081,344,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5633/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,081,536,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5634/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,081,728,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5635/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=1,081,920,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5636/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,082,112,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5637/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,082,304,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5638/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,082,496,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5639/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,082,688,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5640/500000]
+ optim/total_grad_norm=1.053
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=1,082,880,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5641/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,083,072,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5642/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,083,264,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5643/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=1,083,456,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5644/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=1,083,648,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5645/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,083,840,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5646/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,084,032,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5647/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,084,224,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5648/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,084,416,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5649/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,084,608,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5650/500000]
+ train/ActionNoiseL2Loss=0.1262
+ throughput/total_tokens=1,084,800,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5651/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=1,084,992,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5652/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,085,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5653/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=1,085,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5654/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,085,568,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5655/500000]
+ train/ActionNoiseL2Loss=0.1371
+ throughput/total_tokens=1,085,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5656/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,085,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5657/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,086,144,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5658/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,086,336,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5659/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,086,528,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5660/500000]
+ optim/total_grad_norm=2.094
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=1,086,720,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=5661/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,086,912,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5662/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,087,104,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5663/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,087,296,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5664/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,087,488,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5665/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,087,680,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5666/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,087,872,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5667/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,088,064,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5668/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,088,256,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5669/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,088,448,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5670/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,088,640,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5671/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,088,832,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5672/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,089,024,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5673/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,089,216,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5674/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,089,408,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5675/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,089,600,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5676/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=1,089,792,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5677/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=1,089,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5678/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,090,176,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5679/500000]
+ train/ActionNoiseL2Loss=0.1235
+ throughput/total_tokens=1,090,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5680/500000]
+ optim/total_grad_norm=1.215
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,090,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5681/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,090,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5682/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,090,944,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5683/500000]
+ train/ActionNoiseL2Loss=0.1320
+ throughput/total_tokens=1,091,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5684/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,091,328,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5685/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=1,091,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5686/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=1,091,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5687/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=1,091,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5688/500000]
+ train/ActionNoiseL2Loss=0.1128
+ throughput/total_tokens=1,092,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5689/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=1,092,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5690/500000]
+ train/ActionNoiseL2Loss=0.1230
+ throughput/total_tokens=1,092,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5691/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,092,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5692/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=1,092,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5693/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=1,093,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5694/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,093,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5695/500000]
+ train/ActionNoiseL2Loss=0.1116
+ throughput/total_tokens=1,093,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5696/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,093,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5697/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=1,093,824,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5698/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,094,016,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5699/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,094,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5700/500000]
+ optim/total_grad_norm=0.8356
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=1,094,400,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=5701/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,094,592,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5702/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,094,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5703/500000]
+ train/ActionNoiseL2Loss=0.1113
+ throughput/total_tokens=1,094,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5704/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,095,168,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5705/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,095,360,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5706/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=1,095,552,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5707/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=1,095,744,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5708/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,095,936,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5709/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=1,096,128,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5710/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,096,320,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=5711/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,096,512,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5712/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,096,704,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5713/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,096,896,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5714/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=1,097,088,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5715/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,097,280,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5716/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,097,472,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5717/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=1,097,664,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5718/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,097,856,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5719/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=1,098,048,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=5720/500000]
+ optim/total_grad_norm=1.125
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=1,098,240,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5721/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,098,432,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5722/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,098,624,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5723/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=1,098,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5724/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=1,099,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5725/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,099,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5726/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,099,392,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5727/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,099,584,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5728/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,099,776,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5729/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,099,968,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5730/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,100,160,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5731/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=1,100,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5732/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,100,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5733/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=1,100,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5734/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=1,100,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5735/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=1,101,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5736/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,101,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5737/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,101,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5738/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=1,101,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5739/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,101,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5740/500000]
+ optim/total_grad_norm=0.5603
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,102,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5741/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=1,102,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5742/500000]
+ train/ActionNoiseL2Loss=0.1068
+ throughput/total_tokens=1,102,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5743/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=1,102,656,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5744/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,102,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5745/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=1,103,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5746/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,103,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5747/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,103,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5748/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,103,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5749/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,103,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5750/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,104,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5751/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,104,192,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5752/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,104,384,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5753/500000]
+ train/ActionNoiseL2Loss=0.1214
+ throughput/total_tokens=1,104,576,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5754/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,104,768,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5755/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,104,960,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5756/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,105,152,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5757/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,105,344,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5758/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,105,536,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5759/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,105,728,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5760/500000]
+ optim/total_grad_norm=0.7849
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=1,105,920,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5761/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,106,112,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5762/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=1,106,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5763/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,106,496,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5764/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=1,106,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5765/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,106,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5766/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,107,072,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5767/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=1,107,264,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5768/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,107,456,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5769/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=1,107,648,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5770/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,107,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5771/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=1,108,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5772/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=1,108,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5773/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=1,108,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5774/500000]
+ train/ActionNoiseL2Loss=0.1312
+ throughput/total_tokens=1,108,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5775/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,108,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5776/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,108,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5777/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,109,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5778/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,109,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5779/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,109,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5780/500000]
+ optim/total_grad_norm=1.272
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=1,109,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5781/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,109,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5782/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,110,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5783/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=1,110,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5784/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=1,110,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5785/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,110,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5786/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,110,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5787/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=1,111,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5788/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=1,111,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5789/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,111,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5790/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=1,111,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5791/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,111,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5792/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=1,112,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5793/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,112,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5794/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,112,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5795/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=1,112,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5796/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,112,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5797/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,113,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5798/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,113,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5799/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,113,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5800/500000]
+ optim/total_grad_norm=0.5387
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,113,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5801/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,113,792,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5802/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,113,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5803/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,114,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5804/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,114,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5805/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,114,560,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5806/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,114,752,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5807/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=1,114,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5808/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,115,136,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5809/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,115,328,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5810/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,115,520,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=5811/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,115,712,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5812/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,115,904,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5813/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=1,116,096,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5814/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,116,288,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5815/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,116,480,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5816/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,116,672,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5817/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,116,864,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5818/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,117,056,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5819/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,117,248,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5820/500000]
+ optim/total_grad_norm=0.9366
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,117,440,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5821/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=1,117,632,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5822/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=1,117,824,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5823/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,118,016,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5824/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=1,118,208,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5825/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,118,400,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=5826/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,118,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5827/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=1,118,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5828/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=1,118,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5829/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,119,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5830/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=1,119,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5831/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=1,119,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5832/500000]
+ train/ActionNoiseL2Loss=0.1364
+ throughput/total_tokens=1,119,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5833/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,119,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5834/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,120,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5835/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,120,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5836/500000]
+ train/ActionNoiseL2Loss=0.0348
+ throughput/total_tokens=1,120,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5837/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,120,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5838/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,120,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5839/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,121,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5840/500000]
+ optim/total_grad_norm=0.8434
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,121,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=5841/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,121,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5842/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,121,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5843/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,121,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5844/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,122,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5845/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,122,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5846/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,122,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5847/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=1,122,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5848/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,122,816,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5849/500000]
+ train/ActionNoiseL2Loss=0.1092
+ throughput/total_tokens=1,123,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5850/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,123,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=5851/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,123,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5852/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,123,584,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5853/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=1,123,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5854/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,123,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5855/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,124,160,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5856/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,124,352,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5857/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=1,124,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5858/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,124,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5859/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,124,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5860/500000]
+ optim/total_grad_norm=1.055
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=1,125,120,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=5861/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,125,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5862/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,125,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5863/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=1,125,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5864/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,125,888,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5865/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=1,126,080,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5866/500000]
+ train/ActionNoiseL2Loss=0.1145
+ throughput/total_tokens=1,126,272,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5867/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,126,464,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5868/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,126,656,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5869/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=1,126,848,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5870/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=1,127,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5871/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,127,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5872/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,127,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5873/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,127,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5874/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,127,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5875/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,128,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5876/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,128,192,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5877/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,128,384,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5878/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,128,576,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5879/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,128,768,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5880/500000]
+ optim/total_grad_norm=1.023
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=1,128,960,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5881/500000]
+ train/ActionNoiseL2Loss=0.1248
+ throughput/total_tokens=1,129,152,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5882/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=1,129,344,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5883/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=1,129,536,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5884/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,129,728,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5885/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,129,920,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5886/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,130,112,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5887/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=1,130,304,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5888/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,130,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5889/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,130,688,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=5890/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,130,880,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5891/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=1,131,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5892/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=1,131,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5893/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,131,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5894/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,131,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5895/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=1,131,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5896/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,132,032,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=5897/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,132,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5898/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,132,416,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=5899/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=1,132,608,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=5900/500000]
+ optim/total_grad_norm=0.9411
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,132,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5901/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,132,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5902/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,133,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5903/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=1,133,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5904/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=1,133,568,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5905/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,133,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5906/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,133,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5907/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,134,144,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5908/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=1,134,336,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5909/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,134,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5910/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=1,134,720,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=5911/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,134,912,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=5912/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=1,135,104,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5913/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,135,296,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5914/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=1,135,488,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=5915/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=1,135,680,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5916/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,135,872,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5917/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=1,136,064,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5918/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,136,256,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5919/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,136,448,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=5920/500000]
+ optim/total_grad_norm=1.501
+ train/ActionNoiseL2Loss=0.1111
+ throughput/total_tokens=1,136,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5921/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,136,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5922/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=1,137,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5923/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,137,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5924/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,137,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5925/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,137,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5926/500000]
+ train/ActionNoiseL2Loss=0.1034
+ throughput/total_tokens=1,137,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5927/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,137,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5928/500000]
+ train/ActionNoiseL2Loss=0.0256
+ throughput/total_tokens=1,138,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5929/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,138,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5930/500000]
+ train/ActionNoiseL2Loss=0.1081
+ throughput/total_tokens=1,138,560,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5931/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,138,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5932/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=1,138,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5933/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,139,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5934/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=1,139,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5935/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,139,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5936/500000]
+ train/ActionNoiseL2Loss=0.1297
+ throughput/total_tokens=1,139,712,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5937/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,139,904,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5938/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,140,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5939/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=1,140,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5940/500000]
+ optim/total_grad_norm=1.142
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=1,140,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5941/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,140,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5942/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,140,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5943/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,141,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5944/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,141,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5945/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,141,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5946/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=1,141,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5947/500000]
+ train/ActionNoiseL2Loss=0.1490
+ throughput/total_tokens=1,141,824,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5948/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,142,016,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=5949/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=1,142,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=5950/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,142,400,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=5951/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,142,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5952/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,142,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5953/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,142,976,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=5954/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=1,143,168,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5955/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,143,360,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5956/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=1,143,552,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5957/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,143,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5958/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=1,143,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5959/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=1,144,128,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5960/500000]
+ optim/total_grad_norm=1.119
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=1,144,320,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5961/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=1,144,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5962/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,144,704,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5963/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,144,896,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5964/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,145,088,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=5965/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,145,280,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=5966/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,145,472,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5967/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=1,145,664,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5968/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,145,856,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=5969/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,146,048,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=5970/500000]
+ train/ActionNoiseL2Loss=0.0260
+ throughput/total_tokens=1,146,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5971/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,146,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5972/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=1,146,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=5973/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,146,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5974/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,147,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5975/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,147,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5976/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,147,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5977/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,147,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5978/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,147,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5979/500000]
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=1,147,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5980/500000]
+ optim/total_grad_norm=1.074
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=1,148,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5981/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=1,148,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5982/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,148,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5983/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,148,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5984/500000]
+ train/ActionNoiseL2Loss=0.0293
+ throughput/total_tokens=1,148,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5985/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,149,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5986/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,149,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5987/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=1,149,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5988/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=1,149,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5989/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=1,149,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5990/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,150,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=5991/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=1,150,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5992/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=1,150,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5993/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,150,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5994/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,150,848,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5995/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,151,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5996/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=1,151,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5997/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,151,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=5998/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=1,151,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=5999/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=1,151,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6000/500000]
+ optim/total_grad_norm=1.272
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=1,152,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+10/13 [04:22:01] INFO | >> Saving config... checkpoint.py:608
+10/13 [04:22:44] INFO | >> Saving model state... checkpoint.py:796
+10/13 [04:23:57] INFO | >> Saving optim state... checkpoint.py:811
+10/13 [04:25:33] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=6001/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,152,192,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6002/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,152,384,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=6003/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,152,576,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=6004/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,152,768,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=6005/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,152,960,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=6006/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=1,153,152,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=6007/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,153,344,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6008/500000]
+ train/ActionNoiseL2Loss=0.1021
+ throughput/total_tokens=1,153,536,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6009/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=1,153,728,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6010/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,153,920,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=6011/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,154,112,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6012/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,154,304,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6013/500000]
+ train/ActionNoiseL2Loss=0.1100
+ throughput/total_tokens=1,154,496,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6014/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,154,688,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6015/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,154,880,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6016/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=1,155,072,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=6017/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,155,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6018/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=1,155,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6019/500000]
+ train/ActionNoiseL2Loss=0.0967
+ throughput/total_tokens=1,155,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6020/500000]
+ optim/total_grad_norm=0.7663
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,155,840,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=6021/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=1,156,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6022/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=1,156,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6023/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,156,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6024/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,156,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6025/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,156,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6026/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,156,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6027/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,157,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6028/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,157,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6029/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,157,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6030/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,157,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6031/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=1,157,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6032/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=1,158,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6033/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,158,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6034/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=1,158,528,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6035/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,158,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6036/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,158,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6037/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,159,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6038/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,159,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6039/500000]
+ train/ActionNoiseL2Loss=0.1417
+ throughput/total_tokens=1,159,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6040/500000]
+ optim/total_grad_norm=0.9680
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,159,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6041/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,159,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6042/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,160,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6043/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,160,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6044/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=1,160,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6045/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=1,160,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6046/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,160,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6047/500000]
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=1,161,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6048/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=1,161,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6049/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,161,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6050/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,161,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6051/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,161,792,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6052/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,161,984,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6053/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=1,162,176,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6054/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=1,162,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6055/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=1,162,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6056/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,162,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6057/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,162,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6058/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,163,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6059/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,163,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6060/500000]
+ optim/total_grad_norm=0.8850
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=1,163,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=6061/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=1,163,712,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6062/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,163,904,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6063/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,164,096,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6064/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=1,164,288,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6065/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=1,164,480,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6066/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=1,164,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6067/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=1,164,864,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=6068/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,165,056,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6069/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,165,248,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6070/500000]
+ train/ActionNoiseL2Loss=0.1244
+ throughput/total_tokens=1,165,440,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6071/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,165,632,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6072/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,165,824,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6073/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,166,016,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6074/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=1,166,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6075/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,166,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6076/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=1,166,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6077/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,166,784,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6078/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,166,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6079/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,167,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6080/500000]
+ optim/total_grad_norm=1.152
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=1,167,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6081/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,167,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6082/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,167,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6083/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,167,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6084/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=1,168,128,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6085/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,168,320,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6086/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=1,168,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6087/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,168,704,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6088/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,168,896,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6089/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=1,169,088,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6090/500000]
+ train/ActionNoiseL2Loss=0.0867
+ throughput/total_tokens=1,169,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6091/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=1,169,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6092/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,169,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6093/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,169,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6094/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,170,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6095/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,170,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6096/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,170,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6097/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,170,624,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6098/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,170,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6099/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=1,171,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6100/500000]
+ optim/total_grad_norm=1.018
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,171,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6101/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,171,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6102/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,171,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6103/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=1,171,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6104/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,171,968,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6105/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,172,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6106/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=1,172,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6107/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,172,544,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6108/500000]
+ train/ActionNoiseL2Loss=0.1024
+ throughput/total_tokens=1,172,736,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6109/500000]
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=1,172,928,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6110/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,173,120,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=6111/500000]
+ train/ActionNoiseL2Loss=0.1059
+ throughput/total_tokens=1,173,312,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6112/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,173,504,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6113/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=1,173,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6114/500000]
+ train/ActionNoiseL2Loss=0.1410
+ throughput/total_tokens=1,173,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6115/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=1,174,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6116/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,174,272,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6117/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,174,464,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6118/500000]
+ train/ActionNoiseL2Loss=0.1578
+ throughput/total_tokens=1,174,656,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6119/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,174,848,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6120/500000]
+ optim/total_grad_norm=1.203
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,175,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6121/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,175,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6122/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=1,175,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6123/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,175,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6124/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,175,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6125/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=1,176,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6126/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,176,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6127/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=1,176,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6128/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,176,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6129/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,176,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6130/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=1,176,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6131/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,177,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6132/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,177,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6133/500000]
+ train/ActionNoiseL2Loss=0.1196
+ throughput/total_tokens=1,177,536,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6134/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,177,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6135/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,177,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6136/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,178,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6137/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=1,178,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6138/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,178,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6139/500000]
+ train/ActionNoiseL2Loss=0.0897
+ throughput/total_tokens=1,178,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6140/500000]
+ optim/total_grad_norm=0.9210
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,178,880,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6141/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=1,179,072,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6142/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,179,264,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6143/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=1,179,456,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6144/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,179,648,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6145/500000]
+ train/ActionNoiseL2Loss=0.1509
+ throughput/total_tokens=1,179,840,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6146/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=1,180,032,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6147/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=1,180,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6148/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=1,180,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6149/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=1,180,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6150/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,180,800,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6151/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,180,992,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6152/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=1,181,184,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6153/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=1,181,376,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6154/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,181,568,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6155/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,181,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6156/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,181,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6157/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=1,182,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6158/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,182,336,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6159/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,182,528,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6160/500000]
+ optim/total_grad_norm=1.584
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=1,182,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=6161/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,182,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6162/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,183,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6163/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=1,183,296,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6164/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=1,183,488,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6165/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,183,680,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6166/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=1,183,872,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6167/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,184,064,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6168/500000]
+ train/ActionNoiseL2Loss=0.1636
+ throughput/total_tokens=1,184,256,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6169/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,184,448,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6170/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,184,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6171/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=1,184,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6172/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=1,185,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6173/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,185,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6174/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,185,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6175/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,185,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6176/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=1,185,792,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6177/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,185,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6178/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=1,186,176,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6179/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=1,186,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6180/500000]
+ optim/total_grad_norm=1.565
+ train/ActionNoiseL2Loss=0.1596
+ throughput/total_tokens=1,186,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6181/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=1,186,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6182/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,186,944,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6183/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,187,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6184/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=1,187,328,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6185/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,187,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6186/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=1,187,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6187/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=1,187,904,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=6188/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,188,096,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=6189/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,188,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6190/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=1,188,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6191/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,188,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6192/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,188,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6193/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,189,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6194/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=1,189,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6195/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,189,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6196/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,189,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6197/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=1,189,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6198/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=1,190,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6199/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,190,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6200/500000]
+ optim/total_grad_norm=0.8481
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,190,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6201/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=1,190,592,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6202/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,190,784,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6203/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,190,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6204/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,191,168,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6205/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=1,191,360,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6206/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,191,552,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6207/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=1,191,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6208/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=1,191,936,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6209/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=1,192,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6210/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=1,192,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=6211/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,192,512,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6212/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=1,192,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6213/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=1,192,896,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6214/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,193,088,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6215/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,193,280,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6216/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,193,472,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6217/500000]
+ train/ActionNoiseL2Loss=0.1350
+ throughput/total_tokens=1,193,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6218/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=1,193,856,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6219/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=1,194,048,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6220/500000]
+ optim/total_grad_norm=0.7257
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,194,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6221/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=1,194,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6222/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,194,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6223/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,194,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6224/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=1,195,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6225/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=1,195,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6226/500000]
+ train/ActionNoiseL2Loss=0.1349
+ throughput/total_tokens=1,195,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6227/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=1,195,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6228/500000]
+ train/ActionNoiseL2Loss=0.1388
+ throughput/total_tokens=1,195,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6229/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,195,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6230/500000]
+ train/ActionNoiseL2Loss=0.1122
+ throughput/total_tokens=1,196,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6231/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,196,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6232/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=1,196,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6233/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=1,196,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6234/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,196,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6235/500000]
+ train/ActionNoiseL2Loss=0.0967
+ throughput/total_tokens=1,197,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6236/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,197,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6237/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,197,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6238/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=1,197,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6239/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,197,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6240/500000]
+ optim/total_grad_norm=0.6915
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,198,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6241/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,198,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6242/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=1,198,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6243/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,198,656,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6244/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,198,848,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6245/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=1,199,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6246/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,199,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6247/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=1,199,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6248/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,199,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6249/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=1,199,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6250/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,200,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6251/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,200,192,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6252/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=1,200,384,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6253/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=1,200,576,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6254/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,200,768,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6255/500000]
+ train/ActionNoiseL2Loss=0.1103
+ throughput/total_tokens=1,200,960,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6256/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,201,152,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6257/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,201,344,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6258/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,201,536,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6259/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,201,728,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6260/500000]
+ optim/total_grad_norm=0.9684
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,201,920,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=6261/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=1,202,112,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6262/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=1,202,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6263/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,202,496,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6264/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,202,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6265/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,202,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6266/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,203,072,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6267/500000]
+ train/ActionNoiseL2Loss=0.1418
+ throughput/total_tokens=1,203,264,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6268/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,203,456,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6269/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,203,648,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6270/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,203,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6271/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,204,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6272/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,204,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6273/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,204,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6274/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,204,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6275/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,204,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6276/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,204,992,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6277/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=1,205,184,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6278/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,205,376,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6279/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,205,568,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6280/500000]
+ optim/total_grad_norm=0.7997
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,205,760,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6281/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=1,205,952,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6282/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,206,144,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6283/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=1,206,336,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6284/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,206,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6285/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,206,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6286/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=1,206,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6287/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=1,207,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6288/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=1,207,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6289/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=1,207,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6290/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=1,207,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6291/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,207,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6292/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,208,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6293/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,208,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6294/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,208,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6295/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,208,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6296/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,208,832,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=6297/500000]
+ train/ActionNoiseL2Loss=0.1252
+ throughput/total_tokens=1,209,024,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6298/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,209,216,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=6299/500000]
+ train/ActionNoiseL2Loss=0.1161
+ throughput/total_tokens=1,209,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6300/500000]
+ optim/total_grad_norm=0.9053
+ train/ActionNoiseL2Loss=0.0956
+ throughput/total_tokens=1,209,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6301/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=1,209,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6302/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=1,209,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6303/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,210,176,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6304/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,210,368,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6305/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,210,560,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6306/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=1,210,752,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6307/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,210,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6308/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,211,136,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6309/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,211,328,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6310/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=1,211,520,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=6311/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,211,712,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6312/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,211,904,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6313/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,212,096,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6314/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,212,288,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6315/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,212,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6316/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,212,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6317/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,212,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6318/500000]
+ train/ActionNoiseL2Loss=0.1027
+ throughput/total_tokens=1,213,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6319/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,213,248,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6320/500000]
+ optim/total_grad_norm=0.8354
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,213,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6321/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=1,213,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6322/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,213,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6323/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,214,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6324/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=1,214,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6325/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,214,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6326/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,214,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6327/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,214,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6328/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,214,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6329/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,215,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6330/500000]
+ train/ActionNoiseL2Loss=0.1101
+ throughput/total_tokens=1,215,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6331/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=1,215,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6332/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,215,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6333/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,215,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6334/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=1,216,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6335/500000]
+ train/ActionNoiseL2Loss=0.1151
+ throughput/total_tokens=1,216,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6336/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,216,512,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6337/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=1,216,704,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6338/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=1,216,896,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6339/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,217,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6340/500000]
+ optim/total_grad_norm=0.7078
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,217,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6341/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,217,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6342/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,217,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6343/500000]
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=1,217,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6344/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,218,048,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6345/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,218,240,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6346/500000]
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=1,218,432,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6347/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,218,624,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6348/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=1,218,816,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6349/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,219,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6350/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=1,219,200,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6351/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,219,392,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6352/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=1,219,584,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6353/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,219,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6354/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,219,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6355/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,220,160,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6356/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=1,220,352,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6357/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,220,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6358/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,220,736,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6359/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=1,220,928,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6360/500000]
+ optim/total_grad_norm=1.611
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=1,221,120,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=6361/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=1,221,312,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6362/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,221,504,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6363/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=1,221,696,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6364/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,221,888,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6365/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=1,222,080,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6366/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,222,272,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6367/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,222,464,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6368/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,222,656,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6369/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=1,222,848,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6370/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,223,040,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6371/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=1,223,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6372/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=1,223,424,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6373/500000]
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=1,223,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6374/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,223,808,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6375/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,224,000,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6376/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=1,224,192,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6377/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,224,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6378/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,224,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6379/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,224,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6380/500000]
+ optim/total_grad_norm=0.9498
+ train/ActionNoiseL2Loss=0.1134
+ throughput/total_tokens=1,224,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6381/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,225,152,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6382/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,225,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6383/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,225,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6384/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,225,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6385/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,225,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6386/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,226,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6387/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,226,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6388/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=1,226,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6389/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=1,226,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6390/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,226,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6391/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=1,227,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6392/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,227,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6393/500000]
+ train/ActionNoiseL2Loss=0.1411
+ throughput/total_tokens=1,227,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6394/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,227,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6395/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,227,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6396/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,228,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6397/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,228,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6398/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=1,228,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6399/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,228,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6400/500000]
+ optim/total_grad_norm=0.7803
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,228,800,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=6401/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,228,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6402/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,229,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6403/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,229,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6404/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,229,568,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6405/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,229,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6406/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,229,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6407/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,230,144,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6408/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,230,336,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6409/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,230,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6410/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,230,720,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=6411/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=1,230,912,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6412/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,231,104,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6413/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,231,296,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6414/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,231,488,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6415/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,231,680,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6416/500000]
+ train/ActionNoiseL2Loss=0.1021
+ throughput/total_tokens=1,231,872,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6417/500000]
+ train/ActionNoiseL2Loss=0.1021
+ throughput/total_tokens=1,232,064,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6418/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,232,256,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6419/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,232,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6420/500000]
+ optim/total_grad_norm=1.323
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=1,232,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6421/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,232,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6422/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,233,024,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6423/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,233,216,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6424/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,233,408,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6425/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,233,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6426/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,233,792,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6427/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,233,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6428/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,234,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6429/500000]
+ train/ActionNoiseL2Loss=0.1001
+ throughput/total_tokens=1,234,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6430/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,234,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6431/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,234,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6432/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,234,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6433/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,235,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6434/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,235,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6435/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,235,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6436/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,235,712,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6437/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,235,904,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6438/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,236,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6439/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,236,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6440/500000]
+ optim/total_grad_norm=1.067
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,236,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6441/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,236,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6442/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,236,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6443/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,237,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6444/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=1,237,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6445/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,237,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6446/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,237,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6447/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,237,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6448/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,238,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6449/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,238,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6450/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,238,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6451/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,238,592,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6452/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,238,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6453/500000]
+ train/ActionNoiseL2Loss=0.1047
+ throughput/total_tokens=1,238,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6454/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,239,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6455/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,239,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6456/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=1,239,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6457/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,239,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6458/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,239,936,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6459/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,240,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6460/500000]
+ optim/total_grad_norm=1.942
+ train/ActionNoiseL2Loss=0.1332
+ throughput/total_tokens=1,240,320,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=6461/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,240,512,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6462/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,240,704,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6463/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,240,896,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6464/500000]
+ train/ActionNoiseL2Loss=0.0228
+ throughput/total_tokens=1,241,088,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6465/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,241,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6466/500000]
+ train/ActionNoiseL2Loss=0.1153
+ throughput/total_tokens=1,241,472,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6467/500000]
+ train/ActionNoiseL2Loss=0.1017
+ throughput/total_tokens=1,241,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6468/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,241,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6469/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,242,048,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6470/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=1,242,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6471/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,242,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6472/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=1,242,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6473/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=1,242,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6474/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=1,243,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6475/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,243,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6476/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,243,392,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6477/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,243,584,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6478/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,243,776,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6479/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,243,968,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6480/500000]
+ optim/total_grad_norm=0.8023
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,244,160,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6481/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,244,352,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6482/500000]
+ train/ActionNoiseL2Loss=0.0289
+ throughput/total_tokens=1,244,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6483/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,244,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6484/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=1,244,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6485/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=1,245,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6486/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=1,245,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6487/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,245,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6488/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,245,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6489/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=1,245,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6490/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,246,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6491/500000]
+ train/ActionNoiseL2Loss=0.1148
+ throughput/total_tokens=1,246,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6492/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=1,246,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6493/500000]
+ train/ActionNoiseL2Loss=0.0230
+ throughput/total_tokens=1,246,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6494/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=1,246,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6495/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,247,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6496/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,247,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6497/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=1,247,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6498/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,247,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6499/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,247,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6500/500000]
+ optim/total_grad_norm=0.7270
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=1,248,000,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+10/13 [07:20:58] INFO | >> Saving config... checkpoint.py:608
+10/13 [07:21:31] INFO | >> Saving model state... checkpoint.py:796
+10/13 [07:22:45] INFO | >> Saving optim state... checkpoint.py:811
+10/13 [07:24:17] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=6501/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,248,192,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=6502/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,248,384,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=6503/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=1,248,576,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=6504/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,248,768,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=6505/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=1,248,960,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=6506/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,249,152,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=6507/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=1,249,344,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=6508/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=1,249,536,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=6509/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,249,728,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=6510/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,249,920,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+ System/Peak GPU Memory (MB)=51,074
+[step=6511/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,250,112,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=6512/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,250,304,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=6513/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=1,250,496,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=6514/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,250,688,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=6515/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,250,880,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=6516/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,251,072,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=6517/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,251,264,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=6518/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,251,456,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=6519/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,251,648,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=6520/500000]
+ optim/total_grad_norm=2.047
+ train/ActionNoiseL2Loss=0.1256
+ throughput/total_tokens=1,251,840,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+ System/Peak GPU Memory (MB)=51,074
+[step=6521/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=1,252,032,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6522/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=1,252,224,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6523/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,252,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6524/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,252,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6525/500000]
+ train/ActionNoiseL2Loss=0.0158
+ throughput/total_tokens=1,252,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6526/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=1,252,992,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6527/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,253,184,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6528/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,253,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6529/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,253,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6530/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=1,253,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6531/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=1,253,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6532/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,254,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6533/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,254,336,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6534/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,254,528,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6535/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,254,720,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6536/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=1,254,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6537/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,255,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6538/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=1,255,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6539/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,255,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6540/500000]
+ optim/total_grad_norm=0.9544
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,255,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6541/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,255,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6542/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,256,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6543/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,256,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6544/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,256,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6545/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,256,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6546/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,256,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6547/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,257,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6548/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,257,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6549/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,257,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6550/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=1,257,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6551/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=1,257,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6552/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,257,984,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6553/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=1,258,176,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6554/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,258,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6555/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=1,258,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6556/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,258,752,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6557/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,258,944,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6558/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,259,136,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6559/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=1,259,328,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6560/500000]
+ optim/total_grad_norm=1.498
+ train/ActionNoiseL2Loss=0.1138
+ throughput/total_tokens=1,259,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=6561/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=1,259,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6562/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,259,904,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6563/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,260,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6564/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=1,260,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6565/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,260,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6566/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,260,672,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6567/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,260,864,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6568/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,261,056,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6569/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,261,248,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6570/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,261,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6571/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,261,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6572/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,261,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6573/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,262,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6574/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,262,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6575/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=1,262,400,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6576/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,262,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6577/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,262,784,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=6578/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,262,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6579/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=1,263,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6580/500000]
+ optim/total_grad_norm=0.9534
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=1,263,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6581/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=1,263,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6582/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,263,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6583/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,263,936,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6584/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,264,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6585/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,264,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6586/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=1,264,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6587/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,264,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6588/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,264,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6589/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,265,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6590/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,265,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6591/500000]
+ train/ActionNoiseL2Loss=0.1299
+ throughput/total_tokens=1,265,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6592/500000]
+ train/ActionNoiseL2Loss=0.0937
+ throughput/total_tokens=1,265,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6593/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=1,265,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6594/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,266,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6595/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=1,266,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6596/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,266,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6597/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,266,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6598/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,266,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6599/500000]
+ train/ActionNoiseL2Loss=0.1109
+ throughput/total_tokens=1,267,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6600/500000]
+ optim/total_grad_norm=1.577
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=1,267,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6601/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,267,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6602/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=1,267,584,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6603/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,267,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6604/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=1,267,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6605/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,268,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6606/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=1,268,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6607/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,268,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6608/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,268,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6609/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=1,268,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6610/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,269,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=6611/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=1,269,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6612/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,269,504,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6613/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=1,269,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6614/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,269,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6615/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,270,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6616/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,270,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6617/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,270,464,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6618/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,270,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6619/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,270,848,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6620/500000]
+ optim/total_grad_norm=0.7401
+ train/ActionNoiseL2Loss=0.0794
+ throughput/total_tokens=1,271,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6621/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,271,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6622/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=1,271,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6623/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,271,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6624/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=1,271,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6625/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=1,272,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6626/500000]
+ train/ActionNoiseL2Loss=0.1009
+ throughput/total_tokens=1,272,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6627/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,272,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6628/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,272,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6629/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,272,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6630/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,272,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6631/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,273,152,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6632/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,273,344,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6633/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,273,536,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6634/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=1,273,728,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6635/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,273,920,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6636/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,274,112,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6637/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,274,304,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6638/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,274,496,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6639/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,274,688,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6640/500000]
+ optim/total_grad_norm=0.7150
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,274,880,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6641/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,275,072,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6642/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,275,264,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6643/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,275,456,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6644/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,275,648,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6645/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=1,275,840,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6646/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,276,032,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6647/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,276,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6648/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,276,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6649/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=1,276,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6650/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,276,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6651/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=1,276,992,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=6652/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=1,277,184,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=6653/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,277,376,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=6654/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=1,277,568,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=6655/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,277,760,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=6656/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,277,952,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=6657/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,278,144,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=6658/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=1,278,336,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=6659/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,278,528,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=6660/500000]
+ optim/total_grad_norm=0.8674
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,278,720,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+ System/Peak GPU Memory (MB)=51,074
+[step=6661/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,278,912,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=6662/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,279,104,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=6663/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,279,296,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=6664/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,279,488,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=6665/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=1,279,680,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=6666/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=1,279,872,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=6667/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,280,064,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=6668/500000]
+ train/ActionNoiseL2Loss=0.1037
+ throughput/total_tokens=1,280,256,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=6669/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,280,448,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=6670/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,280,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6671/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,280,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6672/500000]
+ train/ActionNoiseL2Loss=0.1282
+ throughput/total_tokens=1,281,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6673/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=1,281,216,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6674/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,281,408,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6675/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=1,281,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6676/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,281,792,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6677/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=1,281,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6678/500000]
+ train/ActionNoiseL2Loss=0.1124
+ throughput/total_tokens=1,282,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6679/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,282,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6680/500000]
+ optim/total_grad_norm=1.033
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,282,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6681/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=1,282,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6682/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=1,282,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6683/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,283,136,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6684/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=1,283,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6685/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,283,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6686/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=1,283,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6687/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=1,283,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6688/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=1,284,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6689/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=1,284,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6690/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,284,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6691/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,284,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6692/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,284,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6693/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=1,285,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6694/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,285,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6695/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,285,440,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6696/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=1,285,632,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6697/500000]
+ train/ActionNoiseL2Loss=0.1594
+ throughput/total_tokens=1,285,824,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6698/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,286,016,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6699/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=1,286,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6700/500000]
+ optim/total_grad_norm=0.8638
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,286,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6701/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=1,286,592,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6702/500000]
+ train/ActionNoiseL2Loss=0.1328
+ throughput/total_tokens=1,286,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6703/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,286,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6704/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,287,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6705/500000]
+ train/ActionNoiseL2Loss=0.1329
+ throughput/total_tokens=1,287,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6706/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=1,287,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6707/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,287,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6708/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,287,936,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6709/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,288,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6710/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,288,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=6711/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,288,512,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6712/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,288,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6713/500000]
+ train/ActionNoiseL2Loss=0.1033
+ throughput/total_tokens=1,288,896,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6714/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,289,088,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6715/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,289,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6716/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,289,472,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6717/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,289,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6718/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,289,856,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6719/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,290,048,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6720/500000]
+ optim/total_grad_norm=1.066
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,290,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6721/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,290,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6722/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,290,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6723/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,290,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6724/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=1,291,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6725/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=1,291,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6726/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,291,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6727/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,291,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6728/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,291,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6729/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,291,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6730/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,292,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6731/500000]
+ train/ActionNoiseL2Loss=0.0976
+ throughput/total_tokens=1,292,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6732/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=1,292,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6733/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=1,292,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6734/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,292,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6735/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,293,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6736/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,293,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6737/500000]
+ train/ActionNoiseL2Loss=0.1188
+ throughput/total_tokens=1,293,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6738/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,293,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6739/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,293,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6740/500000]
+ optim/total_grad_norm=0.7627
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,294,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6741/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,294,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6742/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,294,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6743/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=1,294,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6744/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,294,848,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6745/500000]
+ train/ActionNoiseL2Loss=0.1414
+ throughput/total_tokens=1,295,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6746/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,295,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6747/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=1,295,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6748/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,295,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6749/500000]
+ train/ActionNoiseL2Loss=0.0982
+ throughput/total_tokens=1,295,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6750/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,296,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6751/500000]
+ train/ActionNoiseL2Loss=0.1206
+ throughput/total_tokens=1,296,192,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6752/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,296,384,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6753/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,296,576,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6754/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,296,768,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6755/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,296,960,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6756/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,297,152,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6757/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,297,344,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6758/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,297,536,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6759/500000]
+ train/ActionNoiseL2Loss=0.1212
+ throughput/total_tokens=1,297,728,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6760/500000]
+ optim/total_grad_norm=0.7885
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=1,297,920,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=6761/500000]
+ train/ActionNoiseL2Loss=0.1625
+ throughput/total_tokens=1,298,112,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6762/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=1,298,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6763/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,298,496,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6764/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,298,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6765/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=1,298,880,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6766/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,299,072,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6767/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,299,264,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6768/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,299,456,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6769/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,299,648,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6770/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,299,840,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6771/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,300,032,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6772/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,300,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6773/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,300,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6774/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,300,608,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6775/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,300,800,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6776/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,300,992,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6777/500000]
+ train/ActionNoiseL2Loss=0.0989
+ throughput/total_tokens=1,301,184,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6778/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=1,301,376,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6779/500000]
+ train/ActionNoiseL2Loss=0.1164
+ throughput/total_tokens=1,301,568,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6780/500000]
+ optim/total_grad_norm=1.232
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=1,301,760,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6781/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,301,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6782/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=1,302,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6783/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,302,336,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6784/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=1,302,528,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6785/500000]
+ train/ActionNoiseL2Loss=0.1414
+ throughput/total_tokens=1,302,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6786/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,302,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6787/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,303,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6788/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,303,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6789/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,303,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6790/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=1,303,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6791/500000]
+ train/ActionNoiseL2Loss=0.0961
+ throughput/total_tokens=1,303,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6792/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,304,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6793/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,304,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6794/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,304,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6795/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=1,304,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6796/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=1,304,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6797/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=1,305,024,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6798/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,305,216,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6799/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,305,408,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6800/500000]
+ optim/total_grad_norm=1.364
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=1,305,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6801/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,305,792,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6802/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,305,984,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6803/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,306,176,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6804/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=1,306,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6805/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,306,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6806/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,306,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6807/500000]
+ train/ActionNoiseL2Loss=0.1219
+ throughput/total_tokens=1,306,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6808/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=1,307,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6809/500000]
+ train/ActionNoiseL2Loss=0.1152
+ throughput/total_tokens=1,307,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6810/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=1,307,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=6811/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,307,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6812/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,307,904,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6813/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,308,096,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6814/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=1,308,288,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6815/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,308,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6816/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,308,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6817/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=1,308,864,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6818/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,309,056,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6819/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=1,309,248,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6820/500000]
+ optim/total_grad_norm=0.6728
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,309,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6821/500000]
+ train/ActionNoiseL2Loss=0.1210
+ throughput/total_tokens=1,309,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6822/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,309,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6823/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=1,310,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6824/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=1,310,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6825/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,310,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6826/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,310,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6827/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,310,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6828/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,310,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6829/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,311,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6830/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,311,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6831/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=1,311,552,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=6832/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=1,311,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6833/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,311,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6834/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=1,312,128,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6835/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,312,320,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6836/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,312,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6837/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=1,312,704,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6838/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,312,896,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6839/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,313,088,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6840/500000]
+ optim/total_grad_norm=0.8406
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,313,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6841/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=1,313,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6842/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=1,313,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6843/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,313,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6844/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,314,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6845/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=1,314,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6846/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,314,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6847/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=1,314,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6848/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,314,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6849/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=1,315,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6850/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,315,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6851/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,315,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6852/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=1,315,584,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6853/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,315,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6854/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=1,315,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6855/500000]
+ train/ActionNoiseL2Loss=0.1157
+ throughput/total_tokens=1,316,160,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6856/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,316,352,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6857/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,316,544,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6858/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,316,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6859/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=1,316,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6860/500000]
+ optim/total_grad_norm=0.7065
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,317,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=6861/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,317,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6862/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,317,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6863/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=1,317,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6864/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=1,317,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6865/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,318,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6866/500000]
+ train/ActionNoiseL2Loss=0.0973
+ throughput/total_tokens=1,318,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6867/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,318,464,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6868/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,318,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6869/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,318,848,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6870/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,319,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6871/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=1,319,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6872/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,319,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6873/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,319,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6874/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,319,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6875/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=1,320,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6876/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=1,320,192,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6877/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,320,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6878/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,320,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6879/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=1,320,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6880/500000]
+ optim/total_grad_norm=0.7664
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,320,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6881/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=1,321,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6882/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,321,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6883/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,321,536,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6884/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,321,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6885/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=1,321,920,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6886/500000]
+ train/ActionNoiseL2Loss=0.1227
+ throughput/total_tokens=1,322,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6887/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,322,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6888/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,322,496,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6889/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,322,688,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6890/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=1,322,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6891/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=1,323,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6892/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,323,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6893/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,323,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6894/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=1,323,648,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6895/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=1,323,840,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6896/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,324,032,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6897/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,324,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6898/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,324,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6899/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,324,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6900/500000]
+ optim/total_grad_norm=1.024
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=1,324,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6901/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=1,324,992,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6902/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=1,325,184,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6903/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,325,376,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6904/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,325,568,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6905/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,325,760,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6906/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=1,325,952,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6907/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,326,144,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6908/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,326,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6909/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,326,528,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6910/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,326,720,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6911/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=1,326,912,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6912/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,327,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6913/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,327,296,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6914/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=1,327,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6915/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,327,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6916/500000]
+ train/ActionNoiseL2Loss=0.1032
+ throughput/total_tokens=1,327,872,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=6917/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,328,064,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6918/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,328,256,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6919/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,328,448,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6920/500000]
+ optim/total_grad_norm=1.102
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=1,328,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6921/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,328,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6922/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,329,024,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6923/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=1,329,216,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6924/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,329,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6925/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,329,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6926/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,329,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6927/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,329,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6928/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,330,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6929/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,330,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6930/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,330,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6931/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,330,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6932/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,330,944,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6933/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=1,331,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6934/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=1,331,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6935/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,331,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6936/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=1,331,712,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6937/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,331,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6938/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,332,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6939/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,332,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6940/500000]
+ optim/total_grad_norm=0.6449
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,332,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6941/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=1,332,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6942/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,332,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6943/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,333,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6944/500000]
+ train/ActionNoiseL2Loss=0.0956
+ throughput/total_tokens=1,333,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6945/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,333,440,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6946/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,333,632,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=6947/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=1,333,824,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6948/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,334,016,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6949/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=1,334,208,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=6950/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,334,400,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=6951/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,334,592,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=6952/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,334,784,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6953/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,334,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6954/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,335,168,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6955/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,335,360,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6956/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=1,335,552,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6957/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,335,744,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6958/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,335,936,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=6959/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,336,128,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=6960/500000]
+ optim/total_grad_norm=0.5599
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,336,320,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=6961/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,336,512,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6962/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,336,704,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6963/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=1,336,896,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=6964/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=1,337,088,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=6965/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=1,337,280,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=6966/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=1,337,472,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=6967/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,337,664,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=6968/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=1,337,856,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=6969/500000]
+ train/ActionNoiseL2Loss=0.1088
+ throughput/total_tokens=1,338,048,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=6970/500000]
+ train/ActionNoiseL2Loss=0.1125
+ throughput/total_tokens=1,338,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6971/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,338,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6972/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=1,338,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6973/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,338,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6974/500000]
+ train/ActionNoiseL2Loss=0.1306
+ throughput/total_tokens=1,339,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=6975/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,339,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6976/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,339,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6977/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,339,584,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6978/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=1,339,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6979/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=1,339,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6980/500000]
+ optim/total_grad_norm=1.742
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=1,340,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6981/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,340,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6982/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,340,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6983/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,340,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6984/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=1,340,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6985/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,341,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=6986/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,341,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6987/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,341,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6988/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,341,696,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6989/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,341,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6990/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,342,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=6991/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=1,342,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6992/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,342,464,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=6993/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,342,656,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=6994/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,342,848,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=6995/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=1,343,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6996/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,343,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6997/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,343,424,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=6998/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,343,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=6999/500000]
+ train/ActionNoiseL2Loss=0.1303
+ throughput/total_tokens=1,343,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7000/500000]
+ optim/total_grad_norm=0.9858
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,344,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+10/13 [10:19:33] INFO | >> Saving config... checkpoint.py:608
+10/13 [10:20:14] INFO | >> Saving model state... checkpoint.py:796
+10/13 [10:21:28] INFO | >> Saving optim state... checkpoint.py:811
+10/13 [10:23:00] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=7001/500000]
+ train/ActionNoiseL2Loss=0.1239
+ throughput/total_tokens=1,344,192,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=7002/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,344,384,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=7003/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,344,576,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=7004/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=1,344,768,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=7005/500000]
+ train/ActionNoiseL2Loss=0.0298
+ throughput/total_tokens=1,344,960,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=7006/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=1,345,152,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=7007/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,345,344,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=7008/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,345,536,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=7009/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,345,728,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=7010/500000]
+ train/ActionNoiseL2Loss=0.1369
+ throughput/total_tokens=1,345,920,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=7011/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=1,346,112,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7012/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,346,304,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7013/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,346,496,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7014/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,346,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7015/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=1,346,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7016/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,347,072,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7017/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=1,347,264,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7018/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,347,456,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7019/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,347,648,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7020/500000]
+ optim/total_grad_norm=0.6040
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,347,840,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=7021/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,348,032,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7022/500000]
+ train/ActionNoiseL2Loss=0.1076
+ throughput/total_tokens=1,348,224,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7023/500000]
+ train/ActionNoiseL2Loss=0.1332
+ throughput/total_tokens=1,348,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7024/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,348,608,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7025/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,348,800,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7026/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=1,348,992,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7027/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,349,184,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7028/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,349,376,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7029/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,349,568,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7030/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,349,760,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7031/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,349,952,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7032/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,350,144,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7033/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,350,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7034/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,350,528,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7035/500000]
+ train/ActionNoiseL2Loss=0.0956
+ throughput/total_tokens=1,350,720,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7036/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,350,912,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7037/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,351,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7038/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,351,296,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7039/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,351,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7040/500000]
+ optim/total_grad_norm=1.314
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=1,351,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7041/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=1,351,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7042/500000]
+ train/ActionNoiseL2Loss=0.1115
+ throughput/total_tokens=1,352,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7043/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,352,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7044/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,352,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7045/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,352,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7046/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,352,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7047/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,353,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7048/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=1,353,216,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7049/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=1,353,408,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7050/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=1,353,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=7051/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,353,792,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7052/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=1,353,984,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7053/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,354,176,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7054/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=1,354,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7055/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,354,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7056/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=1,354,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7057/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,354,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7058/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,355,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7059/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,355,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7060/500000]
+ optim/total_grad_norm=0.5719
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,355,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7061/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,355,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7062/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,355,904,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7063/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,356,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7064/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,356,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7065/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=1,356,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7066/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,356,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7067/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,356,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7068/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,357,056,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7069/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=1,357,248,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7070/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,357,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7071/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,357,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7072/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,357,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7073/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,358,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7074/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,358,208,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7075/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,358,400,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7076/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,358,592,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7077/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,358,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7078/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,358,976,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7079/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,359,168,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7080/500000]
+ optim/total_grad_norm=0.7593
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,359,360,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7081/500000]
+ train/ActionNoiseL2Loss=0.1247
+ throughput/total_tokens=1,359,552,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7082/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,359,744,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7083/500000]
+ train/ActionNoiseL2Loss=0.1250
+ throughput/total_tokens=1,359,936,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7084/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=1,360,128,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7085/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,360,320,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7086/500000]
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=1,360,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7087/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,360,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7088/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,360,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7089/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,361,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7090/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=1,361,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7091/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=1,361,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7092/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,361,664,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7093/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,361,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7094/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,362,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7095/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,362,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7096/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,362,432,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7097/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,362,624,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7098/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,362,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7099/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,363,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7100/500000]
+ optim/total_grad_norm=1.279
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,363,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7101/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,363,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7102/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,363,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7103/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,363,776,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7104/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,363,968,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7105/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,364,160,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7106/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,364,352,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7107/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,364,544,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7108/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,364,736,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7109/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,364,928,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7110/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,365,120,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=7111/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,365,312,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7112/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,365,504,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7113/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=1,365,696,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7114/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=1,365,888,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7115/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=1,366,080,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7116/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,366,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7117/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,366,464,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7118/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=1,366,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7119/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,366,848,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7120/500000]
+ optim/total_grad_norm=1.175
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=1,367,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7121/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,367,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7122/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,367,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7123/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=1,367,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7124/500000]
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=1,367,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7125/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,368,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7126/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,368,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7127/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,368,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7128/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=1,368,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7129/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,368,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7130/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,368,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7131/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=1,369,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7132/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,369,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7133/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,369,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7134/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,369,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7135/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=1,369,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7136/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,370,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7137/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,370,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7138/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=1,370,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7139/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,370,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7140/500000]
+ optim/total_grad_norm=1.056
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=1,370,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7141/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=1,371,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7142/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,371,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7143/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=1,371,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7144/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=1,371,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7145/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=1,371,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7146/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,372,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7147/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=1,372,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7148/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=1,372,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7149/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,372,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7150/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=1,372,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7151/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,372,992,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7152/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,373,184,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7153/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,373,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7154/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=1,373,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7155/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,373,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7156/500000]
+ train/ActionNoiseL2Loss=0.1005
+ throughput/total_tokens=1,373,952,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7157/500000]
+ train/ActionNoiseL2Loss=0.1023
+ throughput/total_tokens=1,374,144,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7158/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,374,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7159/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,374,528,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7160/500000]
+ optim/total_grad_norm=0.7067
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,374,720,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7161/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=1,374,912,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7162/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=1,375,104,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7163/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,375,296,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7164/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=1,375,488,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7165/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,375,680,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7166/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,375,872,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7167/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,376,064,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7168/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=1,376,256,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7169/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=1,376,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7170/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,376,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7171/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,376,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7172/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=1,377,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7173/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,377,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7174/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,377,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7175/500000]
+ train/ActionNoiseL2Loss=0.1352
+ throughput/total_tokens=1,377,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7176/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,377,792,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7177/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,377,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7178/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=1,378,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7179/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=1,378,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7180/500000]
+ optim/total_grad_norm=0.7979
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,378,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7181/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=1,378,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7182/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=1,378,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7183/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,379,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7184/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=1,379,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7185/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=1,379,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7186/500000]
+ train/ActionNoiseL2Loss=0.1198
+ throughput/total_tokens=1,379,712,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7187/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,379,904,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7188/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=1,380,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7189/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,380,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7190/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,380,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7191/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=1,380,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7192/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,380,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7193/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=1,381,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7194/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,381,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7195/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,381,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7196/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,381,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7197/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,381,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7198/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=1,382,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7199/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,382,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7200/500000]
+ optim/total_grad_norm=1.941
+ train/ActionNoiseL2Loss=0.1320
+ throughput/total_tokens=1,382,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7201/500000]
+ train/ActionNoiseL2Loss=0.1372
+ throughput/total_tokens=1,382,592,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7202/500000]
+ train/ActionNoiseL2Loss=0.1172
+ throughput/total_tokens=1,382,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7203/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,382,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7204/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=1,383,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7205/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=1,383,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7206/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,383,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7207/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,383,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7208/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=1,383,936,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7209/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,384,128,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7210/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,384,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7211/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,384,512,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7212/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=1,384,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7213/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,384,896,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7214/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,385,088,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7215/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,385,280,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7216/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=1,385,472,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7217/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=1,385,664,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7218/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=1,385,856,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7219/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,386,048,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7220/500000]
+ optim/total_grad_norm=1.286
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=1,386,240,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=7221/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=1,386,432,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7222/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,386,624,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7223/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,386,816,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7224/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=1,387,008,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7225/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=1,387,200,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7226/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,387,392,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7227/500000]
+ train/ActionNoiseL2Loss=0.1107
+ throughput/total_tokens=1,387,584,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7228/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=1,387,776,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7229/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,387,968,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7230/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,388,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=7231/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,388,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7232/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,388,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7233/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,388,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7234/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,388,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7235/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,389,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7236/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=1,389,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7237/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,389,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7238/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,389,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7239/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=1,389,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7240/500000]
+ optim/total_grad_norm=0.7112
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,390,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7241/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,390,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7242/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,390,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7243/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,390,656,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7244/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,390,848,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7245/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,391,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7246/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,391,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7247/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=1,391,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7248/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=1,391,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7249/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,391,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7250/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,392,000,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7251/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,392,192,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7252/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,392,384,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7253/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,392,576,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7254/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=1,392,768,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7255/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,392,960,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7256/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,393,152,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7257/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,393,344,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7258/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,393,536,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7259/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,393,728,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7260/500000]
+ optim/total_grad_norm=1.323
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=1,393,920,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7261/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,394,112,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7262/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,394,304,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7263/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=1,394,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7264/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,394,688,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7265/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,394,880,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7266/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,395,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7267/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,395,264,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7268/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=1,395,456,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7269/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,395,648,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7270/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,395,840,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=7271/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,396,032,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7272/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,396,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7273/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,396,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7274/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=1,396,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7275/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=1,396,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7276/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=1,396,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7277/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=1,397,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7278/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,397,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7279/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,397,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7280/500000]
+ optim/total_grad_norm=0.7861
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=1,397,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=7281/500000]
+ train/ActionNoiseL2Loss=0.0905
+ throughput/total_tokens=1,397,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7282/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,398,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7283/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=1,398,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7284/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,398,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7285/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,398,720,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7286/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,398,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7287/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,399,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7288/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=1,399,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7289/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,399,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7290/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,399,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=7291/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,399,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7292/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=1,400,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7293/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=1,400,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7294/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,400,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7295/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,400,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7296/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=1,400,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7297/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,401,024,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7298/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,401,216,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7299/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=1,401,408,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7300/500000]
+ optim/total_grad_norm=0.8311
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=1,401,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7301/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,401,792,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7302/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=1,401,984,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7303/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,402,176,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7304/500000]
+ train/ActionNoiseL2Loss=0.1006
+ throughput/total_tokens=1,402,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7305/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,402,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7306/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=1,402,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7307/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,402,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7308/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,403,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7309/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=1,403,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7310/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,403,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7311/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,403,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7312/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,403,904,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7313/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=1,404,096,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7314/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,404,288,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7315/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,404,480,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7316/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,404,672,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7317/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=1,404,864,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7318/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,405,056,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7319/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,405,248,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7320/500000]
+ optim/total_grad_norm=1.239
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=1,405,440,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=7321/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=1,405,632,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7322/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=1,405,824,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7323/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,406,016,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7324/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,406,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7325/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,406,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7326/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,406,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7327/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,406,784,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7328/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=1,406,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7329/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,407,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7330/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,407,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7331/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,407,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7332/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,407,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7333/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,407,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7334/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,408,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7335/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=1,408,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7336/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,408,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7337/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=1,408,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7338/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,408,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7339/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,409,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7340/500000]
+ optim/total_grad_norm=0.7994
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,409,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7341/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,409,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7342/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,409,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7343/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,409,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7344/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=1,410,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7345/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,410,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7346/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,410,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7347/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,410,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7348/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=1,410,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7349/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,411,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7350/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,411,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7351/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,411,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7352/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,411,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7353/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,411,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7354/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,411,968,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7355/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,412,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7356/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,412,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7357/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,412,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7358/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,412,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7359/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,412,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7360/500000]
+ optim/total_grad_norm=0.6978
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,413,120,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7361/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,413,312,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7362/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=1,413,504,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7363/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,413,696,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7364/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,413,888,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7365/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,414,080,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7366/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,414,272,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7367/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,414,464,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7368/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,414,656,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7369/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,414,848,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7370/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,415,040,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7371/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,415,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7372/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,415,424,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7373/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=1,415,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7374/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=1,415,808,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7375/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,416,000,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7376/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=1,416,192,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7377/500000]
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=1,416,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7378/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=1,416,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7379/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,416,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7380/500000]
+ optim/total_grad_norm=0.8140
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=1,416,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=7381/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,417,152,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7382/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,417,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7383/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,417,536,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7384/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,417,728,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7385/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,417,920,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7386/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,418,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7387/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,418,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7388/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=1,418,496,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7389/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,418,688,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7390/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,418,880,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=7391/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,419,072,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7392/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,419,264,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7393/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,419,456,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7394/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,419,648,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7395/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,419,840,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7396/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,420,032,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7397/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,420,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7398/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,420,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7399/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,420,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7400/500000]
+ optim/total_grad_norm=0.7482
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,420,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=7401/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,420,992,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7402/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,421,184,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7403/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=1,421,376,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7404/500000]
+ train/ActionNoiseL2Loss=0.1463
+ throughput/total_tokens=1,421,568,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7405/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=1,421,760,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7406/500000]
+ train/ActionNoiseL2Loss=0.1040
+ throughput/total_tokens=1,421,952,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7407/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,422,144,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7408/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,422,336,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7409/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=1,422,528,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7410/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,422,720,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7411/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,422,912,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7412/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,423,104,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7413/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,423,296,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7414/500000]
+ train/ActionNoiseL2Loss=0.0863
+ throughput/total_tokens=1,423,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7415/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=1,423,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7416/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=1,423,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7417/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=1,424,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7418/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=1,424,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7419/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,424,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7420/500000]
+ optim/total_grad_norm=1.010
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,424,640,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=7421/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,424,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7422/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,425,024,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7423/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=1,425,216,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7424/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,425,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7425/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,425,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7426/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,425,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7427/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,425,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7428/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,426,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7429/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,426,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7430/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,426,560,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7431/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,426,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7432/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=1,426,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7433/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,427,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7434/500000]
+ train/ActionNoiseL2Loss=0.1389
+ throughput/total_tokens=1,427,328,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7435/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,427,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7436/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,427,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7437/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,427,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7438/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,428,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7439/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=1,428,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7440/500000]
+ optim/total_grad_norm=0.6409
+ train/ActionNoiseL2Loss=0.0203
+ throughput/total_tokens=1,428,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7441/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,428,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7442/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,428,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7443/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,429,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7444/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=1,429,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7445/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,429,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7446/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,429,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7447/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,429,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7448/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=1,430,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7449/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,430,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7450/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,430,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7451/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=1,430,592,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=7452/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=1,430,784,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=7453/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=1,430,976,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=7454/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,431,168,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=7455/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=1,431,360,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=7456/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,431,552,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=7457/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,431,744,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=7458/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,431,936,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=7459/500000]
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,432,128,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=7460/500000]
+ optim/total_grad_norm=0.9396
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=1,432,320,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+ System/Peak GPU Memory (MB)=51,074
+[step=7461/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=1,432,512,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=7462/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=1,432,704,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=7463/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,432,896,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=7464/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,433,088,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=7465/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=1,433,280,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=7466/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=1,433,472,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=7467/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,433,664,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=7468/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,433,856,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=7469/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,434,048,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0477
+[step=7470/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,434,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7471/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,434,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7472/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,434,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7473/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=1,434,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7474/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,435,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7475/500000]
+ train/ActionNoiseL2Loss=0.1315
+ throughput/total_tokens=1,435,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7476/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,435,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7477/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,435,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7478/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,435,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7479/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,435,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7480/500000]
+ optim/total_grad_norm=0.8352
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,436,160,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7481/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,436,352,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7482/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,436,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7483/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=1,436,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7484/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,436,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7485/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=1,437,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7486/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=1,437,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7487/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,437,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7488/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,437,696,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7489/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,437,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7490/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,438,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7491/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,438,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7492/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,438,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7493/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,438,656,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7494/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,438,848,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7495/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=1,439,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7496/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,439,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7497/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,439,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7498/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=1,439,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7499/500000]
+ train/ActionNoiseL2Loss=0.0211
+ throughput/total_tokens=1,439,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7500/500000]
+ optim/total_grad_norm=0.9110
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=1,440,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+10/13 [13:18:06] INFO | >> Saving config... checkpoint.py:608
+10/13 [13:18:52] INFO | >> Saving model state... checkpoint.py:796
+10/13 [13:20:07] INFO | >> Saving optim state... checkpoint.py:811
+10/13 [13:21:41] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=7501/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,440,192,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=7502/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,440,384,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=7503/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,440,576,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=7504/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,440,768,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=7505/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,440,960,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=7506/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,441,152,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7507/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=1,441,344,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7508/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=1,441,536,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=7509/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=1,441,728,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=7510/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=1,441,920,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=7511/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,442,112,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7512/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,442,304,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7513/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=1,442,496,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7514/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=1,442,688,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7515/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,442,880,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7516/500000]
+ train/ActionNoiseL2Loss=0.1233
+ throughput/total_tokens=1,443,072,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7517/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=1,443,264,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7518/500000]
+ train/ActionNoiseL2Loss=0.0931
+ throughput/total_tokens=1,443,456,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7519/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,443,648,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7520/500000]
+ optim/total_grad_norm=1.117
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,443,840,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7521/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=1,444,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7522/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,444,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7523/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,444,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7524/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,444,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7525/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,444,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7526/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,444,992,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7527/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,445,184,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7528/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,445,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7529/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=1,445,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7530/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,445,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7531/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,445,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7532/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=1,446,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7533/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,446,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7534/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,446,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7535/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,446,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7536/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,446,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7537/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,447,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7538/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,447,296,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7539/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,447,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7540/500000]
+ optim/total_grad_norm=0.9087
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,447,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7541/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=1,447,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7542/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,448,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7543/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,448,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7544/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,448,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7545/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,448,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7546/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,448,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7547/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,449,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7548/500000]
+ train/ActionNoiseL2Loss=0.1149
+ throughput/total_tokens=1,449,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7549/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,449,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7550/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,449,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7551/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,449,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7552/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,449,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7553/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,450,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7554/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,450,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7555/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=1,450,560,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7556/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,450,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7557/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=1,450,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7558/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,451,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7559/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,451,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7560/500000]
+ optim/total_grad_norm=0.8219
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,451,520,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7561/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=1,451,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7562/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,451,904,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7563/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,452,096,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7564/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,452,288,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7565/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,452,480,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7566/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,452,672,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7567/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=1,452,864,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7568/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=1,453,056,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7569/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,453,248,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7570/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,453,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7571/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,453,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7572/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=1,453,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7573/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,454,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7574/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,454,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7575/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=1,454,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7576/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,454,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7577/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,454,784,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7578/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=1,454,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7579/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,455,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7580/500000]
+ optim/total_grad_norm=1.033
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,455,360,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7581/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,455,552,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7582/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=1,455,744,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7583/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,455,936,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7584/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,456,128,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7585/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,456,320,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7586/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=1,456,512,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7587/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,456,704,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7588/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,456,896,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7589/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,457,088,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7590/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,457,280,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7591/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,457,472,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7592/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,457,664,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7593/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,457,856,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7594/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=1,458,048,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7595/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,458,240,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7596/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,458,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7597/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,458,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7598/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,458,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7599/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=1,459,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7600/500000]
+ optim/total_grad_norm=0.9380
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,459,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7601/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,459,392,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7602/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,459,584,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7603/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=1,459,776,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7604/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=1,459,968,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7605/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=1,460,160,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7606/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,460,352,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7607/500000]
+ train/ActionNoiseL2Loss=0.1258
+ throughput/total_tokens=1,460,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7608/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,460,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7609/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,460,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7610/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=1,461,120,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7611/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=1,461,312,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7612/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,461,504,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7613/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,461,696,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7614/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,461,888,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7615/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=1,462,080,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7616/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=1,462,272,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7617/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=1,462,464,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7618/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,462,656,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7619/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=1,462,848,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7620/500000]
+ optim/total_grad_norm=0.7557
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,463,040,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=7621/500000]
+ train/ActionNoiseL2Loss=0.0229
+ throughput/total_tokens=1,463,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7622/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=1,463,424,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7623/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,463,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7624/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,463,808,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7625/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,464,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7626/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,464,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7627/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,464,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7628/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,464,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7629/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=1,464,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7630/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,464,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7631/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,465,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7632/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,465,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7633/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,465,536,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7634/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,465,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7635/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=1,465,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7636/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,466,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7637/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,466,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7638/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,466,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7639/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=1,466,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7640/500000]
+ optim/total_grad_norm=0.8628
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=1,466,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7641/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,467,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7642/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,467,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7643/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,467,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7644/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,467,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7645/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,467,840,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7646/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,468,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7647/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,468,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7648/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,468,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7649/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=1,468,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7650/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,468,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7651/500000]
+ train/ActionNoiseL2Loss=0.1109
+ throughput/total_tokens=1,468,992,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7652/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,469,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7653/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,469,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7654/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,469,568,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7655/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,469,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7656/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=1,469,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7657/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,470,144,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7658/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,470,336,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7659/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,470,528,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=7660/500000]
+ optim/total_grad_norm=0.8523
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,470,720,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+ System/Peak GPU Memory (MB)=51,074
+[step=7661/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,470,912,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=7662/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,471,104,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=7663/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,471,296,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=7664/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=1,471,488,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=7665/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=1,471,680,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=7666/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,471,872,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=7667/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,472,064,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=7668/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,472,256,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=7669/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=1,472,448,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=7670/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=1,472,640,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7671/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=1,472,832,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7672/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,473,024,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7673/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=1,473,216,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7674/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,473,408,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7675/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,473,600,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7676/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,473,792,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7677/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,473,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7678/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=1,474,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7679/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=1,474,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7680/500000]
+ optim/total_grad_norm=0.7496
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,474,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=7681/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,474,752,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7682/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,474,944,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7683/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,475,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7684/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=1,475,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7685/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=1,475,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7686/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,475,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7687/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,475,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7688/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=1,476,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7689/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,476,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7690/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=1,476,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7691/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=1,476,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7692/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,476,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7693/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,477,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7694/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=1,477,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7695/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,477,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7696/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,477,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7697/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,477,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7698/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,478,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7699/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,478,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7700/500000]
+ optim/total_grad_norm=0.8408
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,478,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7701/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=1,478,592,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7702/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,478,784,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7703/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,478,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7704/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,479,168,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7705/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=1,479,360,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7706/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=1,479,552,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7707/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,479,744,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7708/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,479,936,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7709/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,480,128,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7710/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,480,320,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7711/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,480,512,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7712/500000]
+ train/ActionNoiseL2Loss=0.1207
+ throughput/total_tokens=1,480,704,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7713/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=1,480,896,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7714/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,481,088,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7715/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,481,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7716/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,481,472,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7717/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=1,481,664,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7718/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,481,856,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7719/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,482,048,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7720/500000]
+ optim/total_grad_norm=0.6014
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,482,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7721/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,482,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7722/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,482,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7723/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,482,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7724/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,483,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7725/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,483,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7726/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,483,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7727/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=1,483,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7728/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,483,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7729/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,483,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7730/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,484,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7731/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,484,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7732/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,484,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7733/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=1,484,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7734/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,484,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7735/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,485,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7736/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,485,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7737/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,485,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7738/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=1,485,696,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7739/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,485,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7740/500000]
+ optim/total_grad_norm=0.9596
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,486,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7741/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,486,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7742/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,486,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7743/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,486,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7744/500000]
+ train/ActionNoiseL2Loss=0.1270
+ throughput/total_tokens=1,486,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7745/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,487,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7746/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,487,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7747/500000]
+ train/ActionNoiseL2Loss=0.1317
+ throughput/total_tokens=1,487,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7748/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,487,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7749/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,487,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7750/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,488,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7751/500000]
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=1,488,192,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7752/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,488,384,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7753/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,488,576,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7754/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,488,768,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7755/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,488,960,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7756/500000]
+ train/ActionNoiseL2Loss=0.1200
+ throughput/total_tokens=1,489,152,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7757/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,489,344,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7758/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=1,489,536,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7759/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,489,728,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7760/500000]
+ optim/total_grad_norm=0.7333
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,489,920,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7761/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,490,112,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7762/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,490,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7763/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,490,496,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7764/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,490,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7765/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,490,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7766/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,491,072,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7767/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,491,264,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7768/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=1,491,456,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7769/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,491,648,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7770/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,491,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7771/500000]
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=1,492,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7772/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,492,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7773/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,492,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7774/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,492,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7775/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,492,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7776/500000]
+ train/ActionNoiseL2Loss=0.1193
+ throughput/total_tokens=1,492,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7777/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,493,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7778/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,493,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7779/500000]
+ train/ActionNoiseL2Loss=0.0983
+ throughput/total_tokens=1,493,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7780/500000]
+ optim/total_grad_norm=0.7625
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,493,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=7781/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,493,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7782/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,494,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7783/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,494,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7784/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,494,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7785/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,494,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7786/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=1,494,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7787/500000]
+ train/ActionNoiseL2Loss=0.1561
+ throughput/total_tokens=1,495,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7788/500000]
+ train/ActionNoiseL2Loss=0.0967
+ throughput/total_tokens=1,495,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7789/500000]
+ train/ActionNoiseL2Loss=0.1397
+ throughput/total_tokens=1,495,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7790/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,495,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=7791/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=1,495,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7792/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,496,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7793/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=1,496,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7794/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,496,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7795/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=1,496,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7796/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,496,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7797/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,497,024,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7798/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,497,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7799/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,497,408,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7800/500000]
+ optim/total_grad_norm=0.9283
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,497,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7801/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,497,792,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7802/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,497,984,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7803/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,498,176,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7804/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,498,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7805/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,498,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7806/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=1,498,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7807/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,498,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7808/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,499,136,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7809/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=1,499,328,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7810/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,499,520,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7811/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,499,712,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7812/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,499,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7813/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,500,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7814/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=1,500,288,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7815/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,500,480,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7816/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,500,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7817/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=1,500,864,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7818/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,501,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7819/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,501,248,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7820/500000]
+ optim/total_grad_norm=0.9853
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,501,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7821/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,501,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7822/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=1,501,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7823/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,502,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7824/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=1,502,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7825/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,502,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7826/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=1,502,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7827/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,502,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7828/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=1,502,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7829/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,503,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7830/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=1,503,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7831/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,503,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7832/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,503,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7833/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,503,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7834/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,504,128,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7835/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,504,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7836/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,504,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7837/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,504,704,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7838/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,504,896,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7839/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,505,088,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7840/500000]
+ optim/total_grad_norm=0.5634
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,505,280,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7841/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,505,472,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7842/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,505,664,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7843/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=1,505,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7844/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=1,506,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7845/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,506,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7846/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,506,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7847/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,506,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7848/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,506,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7849/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,507,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7850/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=1,507,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7851/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,507,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7852/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=1,507,584,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7853/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=1,507,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7854/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=1,507,968,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7855/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,508,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7856/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,508,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7857/500000]
+ train/ActionNoiseL2Loss=0.0961
+ throughput/total_tokens=1,508,544,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7858/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,508,736,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7859/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,508,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7860/500000]
+ optim/total_grad_norm=1.525
+ train/ActionNoiseL2Loss=0.0953
+ throughput/total_tokens=1,509,120,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7861/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,509,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7862/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=1,509,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7863/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,509,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7864/500000]
+ train/ActionNoiseL2Loss=0.1084
+ throughput/total_tokens=1,509,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7865/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=1,510,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7866/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,510,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7867/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,510,464,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7868/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=1,510,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7869/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,510,848,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7870/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,511,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7871/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,511,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7872/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,511,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7873/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,511,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7874/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,511,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7875/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,512,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7876/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,512,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7877/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,512,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7878/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,512,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7879/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=1,512,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7880/500000]
+ optim/total_grad_norm=0.5876
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,512,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=7881/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=1,513,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7882/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,513,344,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7883/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,513,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7884/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,513,728,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7885/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=1,513,920,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7886/500000]
+ train/ActionNoiseL2Loss=0.1298
+ throughput/total_tokens=1,514,112,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=7887/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,514,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7888/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=1,514,496,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7889/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=1,514,688,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7890/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,514,880,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=7891/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=1,515,072,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7892/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=1,515,264,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7893/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,515,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7894/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,515,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7895/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,515,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7896/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=1,516,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7897/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,516,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7898/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,516,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7899/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=1,516,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7900/500000]
+ optim/total_grad_norm=0.9835
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,516,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7901/500000]
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=1,516,992,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7902/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,517,184,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7903/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=1,517,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7904/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,517,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7905/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=1,517,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7906/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,517,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7907/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,518,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7908/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=1,518,336,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7909/500000]
+ train/ActionNoiseL2Loss=0.0906
+ throughput/total_tokens=1,518,528,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7910/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=1,518,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7911/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=1,518,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7912/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,519,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7913/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,519,296,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7914/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,519,488,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7915/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=1,519,680,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7916/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=1,519,872,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7917/500000]
+ train/ActionNoiseL2Loss=0.1396
+ throughput/total_tokens=1,520,064,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7918/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,520,256,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7919/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,520,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7920/500000]
+ optim/total_grad_norm=1.500
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,520,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7921/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,520,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7922/500000]
+ train/ActionNoiseL2Loss=0.0329
+ throughput/total_tokens=1,521,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7923/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,521,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7924/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,521,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7925/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,521,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7926/500000]
+ train/ActionNoiseL2Loss=0.1477
+ throughput/total_tokens=1,521,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7927/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=1,521,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7928/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=1,522,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7929/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=1,522,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7930/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=1,522,560,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7931/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=1,522,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7932/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,522,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7933/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,523,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7934/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,523,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7935/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,523,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7936/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,523,712,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7937/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,523,904,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7938/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,524,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7939/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,524,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7940/500000]
+ optim/total_grad_norm=1.054
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,524,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7941/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,524,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7942/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,524,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7943/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,525,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7944/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,525,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7945/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,525,440,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7946/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,525,632,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7947/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,525,824,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=7948/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,526,016,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7949/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,526,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=7950/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=1,526,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7951/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=1,526,592,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7952/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,526,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7953/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,526,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7954/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,527,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=7955/500000]
+ train/ActionNoiseL2Loss=0.1226
+ throughput/total_tokens=1,527,360,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7956/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,527,552,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7957/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,527,744,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7958/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,527,936,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7959/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,528,128,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7960/500000]
+ optim/total_grad_norm=0.8932
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,528,320,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7961/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=1,528,512,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=7962/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,528,704,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=7963/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,528,896,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7964/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,529,088,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7965/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,529,280,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7966/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,529,472,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7967/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,529,664,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7968/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,529,856,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7969/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,530,048,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=7970/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,530,240,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=7971/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=1,530,432,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7972/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,530,624,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7973/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,530,816,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7974/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,531,008,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7975/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,531,200,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7976/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,531,392,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7977/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=1,531,584,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7978/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,531,776,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7979/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,531,968,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=7980/500000]
+ optim/total_grad_norm=1.068
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,532,160,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7981/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,532,352,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=7982/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,532,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7983/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,532,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7984/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=1,532,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7985/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,533,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7986/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,533,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7987/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,533,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7988/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=1,533,696,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7989/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,533,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7990/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,534,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=7991/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,534,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7992/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,534,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=7993/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,534,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7994/500000]
+ train/ActionNoiseL2Loss=0.0971
+ throughput/total_tokens=1,534,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7995/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,535,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7996/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,535,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7997/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,535,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7998/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,535,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=7999/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,535,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8000/500000]
+ optim/total_grad_norm=0.8881
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,536,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+10/13 [16:16:52] INFO | >> Saving config... checkpoint.py:608
+10/13 [16:17:48] INFO | >> Saving model state... checkpoint.py:796
+10/13 [16:19:08] INFO | >> Saving optim state... checkpoint.py:811
+10/13 [16:20:40] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=8001/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,536,192,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0473
+[step=8002/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,536,384,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=8003/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,536,576,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=8004/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,536,768,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=8005/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,536,960,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=8006/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=1,537,152,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=8007/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,537,344,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=8008/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,537,536,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8009/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=1,537,728,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8010/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,537,920,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=8011/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,538,112,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8012/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=1,538,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8013/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,538,496,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8014/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,538,688,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8015/500000]
+ train/ActionNoiseL2Loss=0.1069
+ throughput/total_tokens=1,538,880,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8016/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,539,072,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8017/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,539,264,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8018/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,539,456,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8019/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,539,648,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8020/500000]
+ optim/total_grad_norm=1.204
+ train/ActionNoiseL2Loss=0.1159
+ throughput/total_tokens=1,539,840,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8021/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,540,032,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8022/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,540,224,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=8023/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=1,540,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8024/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=1,540,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8025/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=1,540,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8026/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,540,992,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8027/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,541,184,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8028/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,541,376,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8029/500000]
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,541,568,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8030/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,541,760,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8031/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,541,952,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8032/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,542,144,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8033/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,542,336,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8034/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,542,528,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8035/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=1,542,720,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8036/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,542,912,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8037/500000]
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=1,543,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8038/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,543,296,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8039/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,543,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8040/500000]
+ optim/total_grad_norm=0.9523
+ train/ActionNoiseL2Loss=0.0961
+ throughput/total_tokens=1,543,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8041/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,543,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8042/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,544,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8043/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,544,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8044/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,544,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8045/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,544,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8046/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=1,544,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8047/500000]
+ train/ActionNoiseL2Loss=0.1026
+ throughput/total_tokens=1,545,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8048/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,545,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8049/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=1,545,408,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8050/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,545,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8051/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=1,545,792,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8052/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,545,984,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8053/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,546,176,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8054/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,546,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8055/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,546,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8056/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,546,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8057/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,546,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8058/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,547,136,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8059/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,547,328,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8060/500000]
+ optim/total_grad_norm=1.001
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,547,520,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8061/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,547,712,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8062/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,547,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8063/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,548,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8064/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,548,288,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8065/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=1,548,480,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8066/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,548,672,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8067/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,548,864,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=8068/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,549,056,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=8069/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,549,248,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8070/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,549,440,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8071/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,549,632,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8072/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,549,824,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8073/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,550,016,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8074/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=1,550,208,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8075/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,550,400,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8076/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=1,550,592,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8077/500000]
+ train/ActionNoiseL2Loss=0.0965
+ throughput/total_tokens=1,550,784,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=8078/500000]
+ train/ActionNoiseL2Loss=0.0976
+ throughput/total_tokens=1,550,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8079/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,551,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8080/500000]
+ optim/total_grad_norm=0.7255
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,551,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8081/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,551,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8082/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=1,551,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8083/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,551,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8084/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=1,552,128,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8085/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,552,320,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8086/500000]
+ train/ActionNoiseL2Loss=0.1022
+ throughput/total_tokens=1,552,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8087/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,552,704,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8088/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,552,896,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8089/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,553,088,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8090/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,553,280,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8091/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,553,472,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8092/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=1,553,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8093/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,553,856,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8094/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,554,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8095/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,554,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8096/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,554,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8097/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,554,624,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8098/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=1,554,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8099/500000]
+ train/ActionNoiseL2Loss=0.0267
+ throughput/total_tokens=1,555,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8100/500000]
+ optim/total_grad_norm=0.7081
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,555,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8101/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,555,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8102/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,555,584,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8103/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,555,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8104/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=1,555,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8105/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=1,556,160,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8106/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,556,352,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8107/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,556,544,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8108/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,556,736,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8109/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,556,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8110/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=1,557,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=8111/500000]
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=1,557,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8112/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,557,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8113/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,557,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8114/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,557,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8115/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,558,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8116/500000]
+ train/ActionNoiseL2Loss=0.1255
+ throughput/total_tokens=1,558,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8117/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,558,464,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8118/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=1,558,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8119/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=1,558,848,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8120/500000]
+ optim/total_grad_norm=0.8103
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,559,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8121/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,559,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8122/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,559,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8123/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,559,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8124/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,559,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8125/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,560,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8126/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=1,560,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8127/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=1,560,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8128/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,560,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8129/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,560,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8130/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,560,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8131/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,561,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8132/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=1,561,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8133/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,561,536,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8134/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,561,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8135/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=1,561,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8136/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,562,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8137/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,562,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8138/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,562,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8139/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,562,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8140/500000]
+ optim/total_grad_norm=0.7262
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,562,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8141/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=1,563,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8142/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=1,563,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8143/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,563,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8144/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=1,563,648,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8145/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,563,840,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8146/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,564,032,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8147/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,564,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8148/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,564,416,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8149/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=1,564,608,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8150/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,564,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8151/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,564,992,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8152/500000]
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=1,565,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8153/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,565,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8154/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,565,568,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8155/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,565,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8156/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=1,565,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8157/500000]
+ train/ActionNoiseL2Loss=0.0963
+ throughput/total_tokens=1,566,144,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8158/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,566,336,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8159/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,566,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8160/500000]
+ optim/total_grad_norm=1.556
+ train/ActionNoiseL2Loss=0.1090
+ throughput/total_tokens=1,566,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8161/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=1,566,912,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8162/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,567,104,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8163/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,567,296,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8164/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=1,567,488,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8165/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,567,680,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8166/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=1,567,872,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8167/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,568,064,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8168/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,568,256,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8169/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,568,448,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8170/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,568,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8171/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,568,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8172/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,569,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8173/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,569,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8174/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,569,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8175/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=1,569,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8176/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,569,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8177/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=1,569,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8178/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,570,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8179/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,570,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8180/500000]
+ optim/total_grad_norm=0.8495
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=1,570,560,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8181/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,570,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8182/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,570,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8183/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=1,571,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8184/500000]
+ train/ActionNoiseL2Loss=0.1273
+ throughput/total_tokens=1,571,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8185/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,571,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8186/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,571,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8187/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=1,571,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8188/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,572,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8189/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,572,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8190/500000]
+ train/ActionNoiseL2Loss=0.1184
+ throughput/total_tokens=1,572,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8191/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=1,572,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8192/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=1,572,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8193/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,573,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8194/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=1,573,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8195/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,573,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8196/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=1,573,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8197/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,573,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8198/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,574,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8199/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=1,574,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8200/500000]
+ optim/total_grad_norm=0.7238
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,574,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8201/500000]
+ train/ActionNoiseL2Loss=0.1231
+ throughput/total_tokens=1,574,592,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8202/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,574,784,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8203/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,574,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8204/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,575,168,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8205/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,575,360,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8206/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,575,552,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8207/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=1,575,744,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8208/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,575,936,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8209/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,576,128,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8210/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,576,320,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=8211/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=1,576,512,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8212/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,576,704,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8213/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,576,896,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8214/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,577,088,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8215/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,577,280,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8216/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=1,577,472,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8217/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,577,664,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8218/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,577,856,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8219/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,578,048,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8220/500000]
+ optim/total_grad_norm=0.5261
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,578,240,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8221/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,578,432,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8222/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,578,624,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8223/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,578,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8224/500000]
+ train/ActionNoiseL2Loss=0.0961
+ throughput/total_tokens=1,579,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8225/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,579,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8226/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=1,579,392,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8227/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,579,584,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8228/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=1,579,776,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8229/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,579,968,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8230/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,580,160,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8231/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,580,352,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8232/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,580,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8233/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,580,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8234/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,580,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8235/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,581,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8236/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,581,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8237/500000]
+ train/ActionNoiseL2Loss=0.1611
+ throughput/total_tokens=1,581,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8238/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=1,581,696,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8239/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=1,581,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8240/500000]
+ optim/total_grad_norm=0.6972
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,582,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8241/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,582,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8242/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,582,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8243/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,582,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8244/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,582,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8245/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=1,583,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8246/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,583,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8247/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,583,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8248/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=1,583,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8249/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=1,583,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8250/500000]
+ train/ActionNoiseL2Loss=0.1205
+ throughput/total_tokens=1,584,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8251/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,584,192,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8252/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=1,584,384,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8253/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,584,576,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8254/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,584,768,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8255/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,584,960,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8256/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,585,152,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8257/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=1,585,344,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8258/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,585,536,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8259/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,585,728,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8260/500000]
+ optim/total_grad_norm=0.8596
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,585,920,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8261/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=1,586,112,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8262/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,586,304,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8263/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,586,496,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8264/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,586,688,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8265/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=1,586,880,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8266/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,587,072,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8267/500000]
+ train/ActionNoiseL2Loss=0.1112
+ throughput/total_tokens=1,587,264,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8268/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=1,587,456,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8269/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,587,648,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8270/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,587,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8271/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,588,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8272/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,588,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8273/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,588,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8274/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=1,588,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8275/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=1,588,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8276/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,588,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8277/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,589,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8278/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,589,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8279/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=1,589,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8280/500000]
+ optim/total_grad_norm=0.5186
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=1,589,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8281/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,589,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8282/500000]
+ train/ActionNoiseL2Loss=0.1045
+ throughput/total_tokens=1,590,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8283/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,590,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8284/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,590,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8285/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,590,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8286/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,590,912,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8287/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,591,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8288/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,591,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8289/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,591,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8290/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=1,591,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8291/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,591,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8292/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,592,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8293/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,592,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8294/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=1,592,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8295/500000]
+ train/ActionNoiseL2Loss=0.1074
+ throughput/total_tokens=1,592,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8296/500000]
+ train/ActionNoiseL2Loss=0.0773
+ throughput/total_tokens=1,592,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8297/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,593,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8298/500000]
+ train/ActionNoiseL2Loss=0.1147
+ throughput/total_tokens=1,593,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8299/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,593,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8300/500000]
+ optim/total_grad_norm=1.183
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,593,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8301/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,593,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8302/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=1,593,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8303/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,594,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8304/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,594,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8305/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,594,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8306/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,594,752,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8307/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,594,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8308/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,595,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8309/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,595,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8310/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,595,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8311/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=1,595,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8312/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,595,904,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8313/500000]
+ train/ActionNoiseL2Loss=0.0975
+ throughput/total_tokens=1,596,096,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8314/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,596,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8315/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,596,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8316/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,596,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8317/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=1,596,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8318/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,597,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8319/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,597,248,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8320/500000]
+ optim/total_grad_norm=1.240
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,597,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8321/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,597,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8322/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,597,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8323/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,598,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8324/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,598,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8325/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=1,598,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8326/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,598,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8327/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,598,784,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8328/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,598,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8329/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,599,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8330/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,599,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8331/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,599,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8332/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,599,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8333/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=1,599,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8334/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=1,600,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8335/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=1,600,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8336/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,600,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8337/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,600,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8338/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,600,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8339/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=1,601,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8340/500000]
+ optim/total_grad_norm=0.5001
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,601,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8341/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,601,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8342/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,601,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8343/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=1,601,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8344/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,602,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8345/500000]
+ train/ActionNoiseL2Loss=0.1201
+ throughput/total_tokens=1,602,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8346/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,602,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8347/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,602,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8348/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=1,602,816,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8349/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,603,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8350/500000]
+ train/ActionNoiseL2Loss=0.0197
+ throughput/total_tokens=1,603,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8351/500000]
+ train/ActionNoiseL2Loss=0.0242
+ throughput/total_tokens=1,603,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8352/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=1,603,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8353/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=1,603,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8354/500000]
+ train/ActionNoiseL2Loss=0.1131
+ throughput/total_tokens=1,603,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8355/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,604,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8356/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,604,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8357/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,604,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8358/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,604,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8359/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,604,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8360/500000]
+ optim/total_grad_norm=1.316
+ train/ActionNoiseL2Loss=0.1226
+ throughput/total_tokens=1,605,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8361/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=1,605,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8362/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=1,605,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8363/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,605,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8364/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=1,605,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8365/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,606,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8366/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,606,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8367/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=1,606,464,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8368/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,606,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8369/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,606,848,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8370/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,607,040,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8371/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,607,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8372/500000]
+ train/ActionNoiseL2Loss=0.1030
+ throughput/total_tokens=1,607,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8373/500000]
+ train/ActionNoiseL2Loss=0.0939
+ throughput/total_tokens=1,607,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8374/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,607,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8375/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,608,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8376/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=1,608,192,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8377/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=1,608,384,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8378/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,608,576,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8379/500000]
+ train/ActionNoiseL2Loss=0.1320
+ throughput/total_tokens=1,608,768,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8380/500000]
+ optim/total_grad_norm=0.9741
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=1,608,960,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8381/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,609,152,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8382/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,609,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8383/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,609,536,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8384/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,609,728,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8385/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,609,920,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8386/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=1,610,112,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8387/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,610,304,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8388/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,610,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8389/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=1,610,688,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8390/500000]
+ train/ActionNoiseL2Loss=0.1277
+ throughput/total_tokens=1,610,880,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8391/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,611,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8392/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,611,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8393/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,611,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8394/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,611,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8395/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,611,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8396/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,612,032,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8397/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,612,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8398/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,612,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8399/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,612,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8400/500000]
+ optim/total_grad_norm=0.8522
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,612,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8401/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=1,612,992,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8402/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,613,184,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8403/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=1,613,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8404/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,613,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8405/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,613,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8406/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,613,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8407/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,614,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8408/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,614,336,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8409/500000]
+ train/ActionNoiseL2Loss=0.1615
+ throughput/total_tokens=1,614,528,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8410/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=1,614,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8411/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=1,614,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8412/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=1,615,104,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8413/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,615,296,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8414/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,615,488,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8415/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=1,615,680,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8416/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,615,872,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8417/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,616,064,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8418/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=1,616,256,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8419/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,616,448,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8420/500000]
+ optim/total_grad_norm=0.7161
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,616,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8421/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,616,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8422/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=1,617,024,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8423/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,617,216,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8424/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,617,408,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8425/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=1,617,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8426/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,617,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8427/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=1,617,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8428/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,618,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8429/500000]
+ train/ActionNoiseL2Loss=0.0644
+ throughput/total_tokens=1,618,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8430/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,618,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8431/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=1,618,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8432/500000]
+ train/ActionNoiseL2Loss=0.0900
+ throughput/total_tokens=1,618,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8433/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=1,619,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8434/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,619,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8435/500000]
+ train/ActionNoiseL2Loss=0.0286
+ throughput/total_tokens=1,619,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8436/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,619,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8437/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,619,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8438/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=1,620,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8439/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,620,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8440/500000]
+ optim/total_grad_norm=1.005
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,620,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8441/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,620,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8442/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,620,864,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8443/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=1,621,056,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8444/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,621,248,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8445/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,621,440,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8446/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,621,632,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8447/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,621,824,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8448/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=1,622,016,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8449/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,622,208,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8450/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=1,622,400,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8451/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,622,592,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8452/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,622,784,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8453/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,622,976,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=8454/500000]
+ train/ActionNoiseL2Loss=0.1113
+ throughput/total_tokens=1,623,168,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=8455/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,623,360,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=8456/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,623,552,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=8457/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,623,744,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=8458/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,623,936,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=8459/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,624,128,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=8460/500000]
+ optim/total_grad_norm=0.8880
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=1,624,320,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=8461/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,624,512,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8462/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,624,704,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=8463/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,624,896,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8464/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,625,088,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8465/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,625,280,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8466/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,625,472,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8467/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,625,664,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8468/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,625,856,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8469/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,626,048,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8470/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,626,240,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8471/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,626,432,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=8472/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,626,624,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8473/500000]
+ train/ActionNoiseL2Loss=0.1066
+ throughput/total_tokens=1,626,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8474/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,627,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8475/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,627,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8476/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,627,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8477/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,627,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8478/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,627,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8479/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=1,627,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8480/500000]
+ optim/total_grad_norm=0.8094
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,628,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8481/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,628,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8482/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,628,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8483/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=1,628,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8484/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=1,628,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8485/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,629,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8486/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=1,629,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8487/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,629,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8488/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=1,629,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8489/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,629,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8490/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,630,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8491/500000]
+ train/ActionNoiseL2Loss=0.0904
+ throughput/total_tokens=1,630,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8492/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=1,630,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8493/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=1,630,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8494/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,630,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8495/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,631,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8496/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,631,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8497/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,631,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8498/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=1,631,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8499/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,631,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8500/500000]
+ optim/total_grad_norm=1.179
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=1,632,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+10/13 [19:16:02] INFO | >> Saving config... checkpoint.py:608
+10/13 [19:16:35] INFO | >> Saving model state... checkpoint.py:796
+10/13 [19:17:48] INFO | >> Saving optim state... checkpoint.py:811
+10/13 [19:19:22] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=8501/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=1,632,192,000
+ throughput/device/tokens_per_second=1,123
+ throughput/device/batches_per_second=0.0468
+[step=8502/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,632,384,000
+ throughput/device/tokens_per_second=1,124
+ throughput/device/batches_per_second=0.0468
+[step=8503/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,632,576,000
+ throughput/device/tokens_per_second=1,114
+ throughput/device/batches_per_second=0.0465
+[step=8504/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=1,632,768,000
+ throughput/device/tokens_per_second=1,122
+ throughput/device/batches_per_second=0.0468
+[step=8505/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,632,960,000
+ throughput/device/tokens_per_second=1,127
+ throughput/device/batches_per_second=0.0470
+[step=8506/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,633,152,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=8507/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,633,344,000
+ throughput/device/tokens_per_second=1,135
+ throughput/device/batches_per_second=0.0473
+[step=8508/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,633,536,000
+ throughput/device/tokens_per_second=1,137
+ throughput/device/batches_per_second=0.0474
+[step=8509/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,633,728,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0475
+[step=8510/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=1,633,920,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+ System/Peak GPU Memory (MB)=51,074
+[step=8511/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,634,112,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0475
+[step=8512/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,634,304,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=8513/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,634,496,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=8514/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,634,688,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=8515/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,634,880,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=8516/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=1,635,072,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=8517/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,635,264,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=8518/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,635,456,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=8519/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,635,648,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=8520/500000]
+ optim/total_grad_norm=0.7519
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,635,840,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+ System/Peak GPU Memory (MB)=51,074
+[step=8521/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,636,032,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8522/500000]
+ train/ActionNoiseL2Loss=0.0994
+ throughput/total_tokens=1,636,224,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8523/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,636,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8524/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,636,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8525/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,636,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8526/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=1,636,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8527/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,637,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8528/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,637,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8529/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,637,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8530/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,637,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8531/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,637,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8532/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,638,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8533/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,638,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8534/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,638,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8535/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,638,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8536/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=1,638,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8537/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,639,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8538/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,639,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8539/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=1,639,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8540/500000]
+ optim/total_grad_norm=0.7932
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,639,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8541/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,639,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8542/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,640,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8543/500000]
+ train/ActionNoiseL2Loss=0.1088
+ throughput/total_tokens=1,640,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8544/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,640,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8545/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,640,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8546/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=1,640,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8547/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,641,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8548/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,641,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8549/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,641,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8550/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,641,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8551/500000]
+ train/ActionNoiseL2Loss=0.0208
+ throughput/total_tokens=1,641,792,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8552/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=1,641,984,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8553/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,642,176,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8554/500000]
+ train/ActionNoiseL2Loss=0.0972
+ throughput/total_tokens=1,642,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8555/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,642,560,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8556/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,642,752,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8557/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,642,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8558/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,643,136,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8559/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,643,328,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8560/500000]
+ optim/total_grad_norm=0.8052
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,643,520,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8561/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,643,712,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8562/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,643,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8563/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,644,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8564/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=1,644,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8565/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,644,480,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8566/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,644,672,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8567/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,644,864,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8568/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,645,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8569/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,645,248,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8570/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,645,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8571/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,645,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8572/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,645,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8573/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,646,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8574/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,646,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8575/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,646,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8576/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,646,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8577/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,646,784,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8578/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,646,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8579/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,647,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8580/500000]
+ optim/total_grad_norm=1.079
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,647,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8581/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,647,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8582/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,647,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8583/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,647,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8584/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,648,128,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8585/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,648,320,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8586/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,648,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8587/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,648,704,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8588/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=1,648,896,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8589/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,649,088,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8590/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,649,280,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8591/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,649,472,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8592/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=1,649,664,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8593/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,649,856,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8594/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,650,048,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8595/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=1,650,240,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8596/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,650,432,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8597/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,650,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8598/500000]
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,650,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8599/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=1,651,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8600/500000]
+ optim/total_grad_norm=0.9702
+ train/ActionNoiseL2Loss=0.0927
+ throughput/total_tokens=1,651,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8601/500000]
+ train/ActionNoiseL2Loss=0.1021
+ throughput/total_tokens=1,651,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8602/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=1,651,584,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8603/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,651,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8604/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,651,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8605/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,652,160,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8606/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,652,352,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8607/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=1,652,544,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8608/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,652,736,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8609/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,652,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8610/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,653,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8611/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,653,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8612/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=1,653,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8613/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,653,696,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8614/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,653,888,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8615/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=1,654,080,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8616/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,654,272,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8617/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,654,464,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8618/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,654,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8619/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=1,654,848,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8620/500000]
+ optim/total_grad_norm=1.020
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=1,655,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8621/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,655,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8622/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,655,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8623/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=1,655,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8624/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,655,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8625/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=1,656,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8626/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,656,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8627/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,656,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8628/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=1,656,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8629/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,656,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8630/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,656,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8631/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,657,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8632/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,657,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8633/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,657,536,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8634/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=1,657,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8635/500000]
+ train/ActionNoiseL2Loss=0.0924
+ throughput/total_tokens=1,657,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8636/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,658,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8637/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,658,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8638/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,658,496,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8639/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,658,688,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8640/500000]
+ optim/total_grad_norm=0.7040
+ train/ActionNoiseL2Loss=0.0238
+ throughput/total_tokens=1,658,880,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8641/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=1,659,072,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8642/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,659,264,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8643/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,659,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8644/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,659,648,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8645/500000]
+ train/ActionNoiseL2Loss=0.1159
+ throughput/total_tokens=1,659,840,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8646/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,660,032,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8647/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,660,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8648/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,660,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8649/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,660,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8650/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,660,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8651/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,660,992,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8652/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,661,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8653/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=1,661,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8654/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,661,568,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8655/500000]
+ train/ActionNoiseL2Loss=0.1072
+ throughput/total_tokens=1,661,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8656/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,661,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8657/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=1,662,144,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8658/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,662,336,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8659/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,662,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8660/500000]
+ optim/total_grad_norm=0.6786
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,662,720,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8661/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,662,912,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8662/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,663,104,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8663/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=1,663,296,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8664/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=1,663,488,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8665/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=1,663,680,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8666/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,663,872,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8667/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,664,064,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8668/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,664,256,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8669/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,664,448,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8670/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=1,664,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8671/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,664,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8672/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,665,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8673/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,665,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8674/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=1,665,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8675/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,665,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8676/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,665,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8677/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,665,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8678/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,666,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8679/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,666,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8680/500000]
+ optim/total_grad_norm=0.8090
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,666,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8681/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=1,666,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8682/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,666,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8683/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,667,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8684/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,667,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8685/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,667,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8686/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,667,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8687/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=1,667,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8688/500000]
+ train/ActionNoiseL2Loss=0.0914
+ throughput/total_tokens=1,668,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8689/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=1,668,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8690/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=1,668,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8691/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=1,668,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8692/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=1,668,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8693/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,669,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8694/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,669,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8695/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,669,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8696/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=1,669,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8697/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=1,669,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8698/500000]
+ train/ActionNoiseL2Loss=0.1469
+ throughput/total_tokens=1,670,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8699/500000]
+ train/ActionNoiseL2Loss=0.1187
+ throughput/total_tokens=1,670,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8700/500000]
+ optim/total_grad_norm=1.110
+ train/ActionNoiseL2Loss=0.0830
+ throughput/total_tokens=1,670,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8701/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,670,592,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8702/500000]
+ train/ActionNoiseL2Loss=0.0276
+ throughput/total_tokens=1,670,784,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8703/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=1,670,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8704/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,671,168,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8705/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,671,360,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8706/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,671,552,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8707/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,671,744,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=8708/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,671,936,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8709/500000]
+ train/ActionNoiseL2Loss=0.1108
+ throughput/total_tokens=1,672,128,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8710/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=1,672,320,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8711/500000]
+ train/ActionNoiseL2Loss=0.0792
+ throughput/total_tokens=1,672,512,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8712/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,672,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8713/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=1,672,896,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8714/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,673,088,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8715/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=1,673,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8716/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,673,472,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8717/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,673,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8718/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,673,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8719/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=1,674,048,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8720/500000]
+ optim/total_grad_norm=0.8148
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=1,674,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8721/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,674,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8722/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,674,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8723/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,674,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8724/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,675,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8725/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,675,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8726/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,675,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8727/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=1,675,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8728/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=1,675,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8729/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,675,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8730/500000]
+ train/ActionNoiseL2Loss=0.1306
+ throughput/total_tokens=1,676,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8731/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,676,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8732/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,676,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8733/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,676,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8734/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=1,676,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8735/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,677,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8736/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,677,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8737/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,677,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8738/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,677,696,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8739/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,677,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8740/500000]
+ optim/total_grad_norm=1.243
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=1,678,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8741/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,678,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8742/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=1,678,464,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8743/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,678,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8744/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,678,848,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8745/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,679,040,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8746/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,679,232,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8747/500000]
+ train/ActionNoiseL2Loss=0.0881
+ throughput/total_tokens=1,679,424,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8748/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,679,616,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8749/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=1,679,808,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8750/500000]
+ train/ActionNoiseL2Loss=0.0855
+ throughput/total_tokens=1,680,000,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8751/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,680,192,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8752/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,680,384,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8753/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,680,576,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8754/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,680,768,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8755/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,680,960,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8756/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=1,681,152,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8757/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=1,681,344,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8758/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,681,536,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8759/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,681,728,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8760/500000]
+ optim/total_grad_norm=0.8033
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,681,920,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8761/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,682,112,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8762/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,682,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8763/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,682,496,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8764/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=1,682,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8765/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,682,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8766/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,683,072,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8767/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,683,264,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8768/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=1,683,456,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8769/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,683,648,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8770/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,683,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8771/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=1,684,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8772/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=1,684,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8773/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=1,684,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8774/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,684,608,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8775/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,684,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8776/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,684,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8777/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,685,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8778/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,685,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8779/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,685,568,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8780/500000]
+ optim/total_grad_norm=0.7047
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=1,685,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8781/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=1,685,952,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8782/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=1,686,144,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8783/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,686,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8784/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,686,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8785/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=1,686,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8786/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,686,912,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8787/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,687,104,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8788/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,687,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8789/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,687,488,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8790/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,687,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8791/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,687,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8792/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=1,688,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8793/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,688,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8794/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,688,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8795/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,688,640,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8796/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,688,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8797/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,689,024,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8798/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,689,216,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8799/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=1,689,408,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8800/500000]
+ optim/total_grad_norm=0.7578
+ train/ActionNoiseL2Loss=0.1109
+ throughput/total_tokens=1,689,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8801/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,689,792,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8802/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,689,984,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8803/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,690,176,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8804/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,690,368,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8805/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,690,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8806/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,690,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8807/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=1,690,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8808/500000]
+ train/ActionNoiseL2Loss=0.0947
+ throughput/total_tokens=1,691,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8809/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,691,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8810/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,691,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8811/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=1,691,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8812/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,691,904,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8813/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,692,096,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8814/500000]
+ train/ActionNoiseL2Loss=0.1266
+ throughput/total_tokens=1,692,288,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8815/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=1,692,480,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8816/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,692,672,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8817/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,692,864,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8818/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,693,056,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8819/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=1,693,248,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8820/500000]
+ optim/total_grad_norm=0.8593
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,693,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8821/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=1,693,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8822/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,693,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8823/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=1,694,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8824/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,694,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8825/500000]
+ train/ActionNoiseL2Loss=0.0992
+ throughput/total_tokens=1,694,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8826/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,694,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8827/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=1,694,784,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8828/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,694,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8829/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,695,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8830/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=1,695,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8831/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,695,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8832/500000]
+ train/ActionNoiseL2Loss=0.1168
+ throughput/total_tokens=1,695,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8833/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=1,695,936,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8834/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=1,696,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8835/500000]
+ train/ActionNoiseL2Loss=0.1346
+ throughput/total_tokens=1,696,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8836/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,696,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8837/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=1,696,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8838/500000]
+ train/ActionNoiseL2Loss=0.1050
+ throughput/total_tokens=1,696,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8839/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,697,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8840/500000]
+ optim/total_grad_norm=1.173
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,697,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8841/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,697,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8842/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=1,697,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8843/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,697,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8844/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=1,698,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8845/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,698,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8846/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=1,698,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8847/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,698,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8848/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,698,816,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8849/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,699,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8850/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,699,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8851/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,699,392,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8852/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,699,584,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8853/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,699,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8854/500000]
+ train/ActionNoiseL2Loss=0.0997
+ throughput/total_tokens=1,699,968,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8855/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,700,160,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=8856/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=1,700,352,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=8857/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,700,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8858/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,700,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8859/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,700,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8860/500000]
+ optim/total_grad_norm=0.8697
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=1,701,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8861/500000]
+ train/ActionNoiseL2Loss=0.1418
+ throughput/total_tokens=1,701,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8862/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,701,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8863/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,701,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8864/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,701,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8865/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,702,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8866/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=1,702,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8867/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=1,702,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8868/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,702,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8869/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,702,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8870/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=1,703,040,000
+ throughput/device/tokens_per_second=1,156
+ throughput/device/batches_per_second=0.0482
+ System/Peak GPU Memory (MB)=51,074
+[step=8871/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,703,232,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=8872/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,703,424,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0482
+[step=8873/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,703,616,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=8874/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,703,808,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8875/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,704,000,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8876/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,704,192,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8877/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,704,384,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8878/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,704,576,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8879/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,704,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8880/500000]
+ optim/total_grad_norm=0.6917
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,704,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8881/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,705,152,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8882/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,705,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8883/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=1,705,536,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8884/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=1,705,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8885/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,705,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8886/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,706,112,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8887/500000]
+ train/ActionNoiseL2Loss=0.0797
+ throughput/total_tokens=1,706,304,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8888/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,706,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8889/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,706,688,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8890/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,706,880,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8891/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,707,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8892/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,707,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=8893/500000]
+ train/ActionNoiseL2Loss=0.0833
+ throughput/total_tokens=1,707,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8894/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,707,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8895/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,707,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8896/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,708,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8897/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=1,708,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8898/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,708,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8899/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,708,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8900/500000]
+ optim/total_grad_norm=1.012
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=1,708,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8901/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,708,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8902/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,709,184,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8903/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,709,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8904/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,709,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8905/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,709,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8906/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,709,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8907/500000]
+ train/ActionNoiseL2Loss=0.0838
+ throughput/total_tokens=1,710,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8908/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,710,336,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8909/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=1,710,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8910/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=1,710,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8911/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=1,710,912,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8912/500000]
+ train/ActionNoiseL2Loss=0.0269
+ throughput/total_tokens=1,711,104,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8913/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,711,296,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8914/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,711,488,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8915/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,711,680,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8916/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,711,872,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8917/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=1,712,064,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8918/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,712,256,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8919/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,712,448,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=8920/500000]
+ optim/total_grad_norm=0.5171
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,712,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8921/500000]
+ train/ActionNoiseL2Loss=0.1018
+ throughput/total_tokens=1,712,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8922/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=1,713,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8923/500000]
+ train/ActionNoiseL2Loss=0.0913
+ throughput/total_tokens=1,713,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8924/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=1,713,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8925/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,713,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8926/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=1,713,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8927/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=1,713,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8928/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,714,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8929/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,714,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8930/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,714,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8931/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,714,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8932/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,714,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8933/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,715,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8934/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,715,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8935/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,715,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8936/500000]
+ train/ActionNoiseL2Loss=0.0274
+ throughput/total_tokens=1,715,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8937/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,715,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8938/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,716,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8939/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,716,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8940/500000]
+ optim/total_grad_norm=0.6544
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=1,716,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8941/500000]
+ train/ActionNoiseL2Loss=0.1143
+ throughput/total_tokens=1,716,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8942/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,716,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8943/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=1,717,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8944/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,717,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8945/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=1,717,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8946/500000]
+ train/ActionNoiseL2Loss=0.0890
+ throughput/total_tokens=1,717,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8947/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,717,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8948/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,718,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8949/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=1,718,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8950/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,718,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8951/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=1,718,592,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8952/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,718,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8953/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,718,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8954/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,719,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8955/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=1,719,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8956/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,719,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8957/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,719,744,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8958/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=1,719,936,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8959/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=1,720,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8960/500000]
+ optim/total_grad_norm=0.7493
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,720,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=8961/500000]
+ train/ActionNoiseL2Loss=0.1132
+ throughput/total_tokens=1,720,512,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8962/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=1,720,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8963/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,720,896,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8964/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,721,088,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8965/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,721,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8966/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=1,721,472,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8967/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=1,721,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8968/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,721,856,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=8969/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=1,722,048,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=8970/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=1,722,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=8971/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,722,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8972/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,722,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8973/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=1,722,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8974/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,723,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=8975/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,723,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8976/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,723,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8977/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=1,723,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8978/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,723,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8979/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=1,723,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8980/500000]
+ optim/total_grad_norm=0.9721
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=1,724,160,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8981/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=1,724,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8982/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,724,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8983/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,724,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8984/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,724,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8985/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=1,725,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8986/500000]
+ train/ActionNoiseL2Loss=0.1020
+ throughput/total_tokens=1,725,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8987/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=1,725,504,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=8988/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,725,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8989/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,725,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8990/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,726,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=8991/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,726,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8992/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,726,464,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8993/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,726,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8994/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,726,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8995/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,727,040,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8996/500000]
+ train/ActionNoiseL2Loss=0.1133
+ throughput/total_tokens=1,727,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8997/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=1,727,424,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=8998/500000]
+ train/ActionNoiseL2Loss=0.1269
+ throughput/total_tokens=1,727,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=8999/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,727,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9000/500000]
+ optim/total_grad_norm=0.7592
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,728,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+10/13 [22:14:35] INFO | >> Saving config... checkpoint.py:608
+10/13 [22:15:08] INFO | >> Saving model state... checkpoint.py:796
+10/13 [22:16:20] INFO | >> Saving optim state... checkpoint.py:811
+10/13 [22:17:53] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=9001/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=1,728,192,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0473
+[step=9002/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=1,728,384,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=9003/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,728,576,000
+ throughput/device/tokens_per_second=1,129
+ throughput/device/batches_per_second=0.0470
+[step=9004/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,728,768,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=9005/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,728,960,000
+ throughput/device/tokens_per_second=1,136
+ throughput/device/batches_per_second=0.0474
+[step=9006/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=1,729,152,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=9007/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=1,729,344,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=9008/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,729,536,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=9009/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=1,729,728,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=9010/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,729,920,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=9011/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,730,112,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=9012/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=1,730,304,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9013/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,730,496,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9014/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=1,730,688,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9015/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,730,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9016/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,731,072,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9017/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,731,264,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9018/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,731,456,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9019/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=1,731,648,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9020/500000]
+ optim/total_grad_norm=0.7044
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,731,840,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=9021/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=1,732,032,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9022/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=1,732,224,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9023/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,732,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9024/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,732,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9025/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,732,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9026/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,732,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9027/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,733,184,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9028/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=1,733,376,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9029/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,733,568,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9030/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,733,760,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9031/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=1,733,952,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9032/500000]
+ train/ActionNoiseL2Loss=0.0261
+ throughput/total_tokens=1,734,144,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9033/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,734,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9034/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,734,528,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9035/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=1,734,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9036/500000]
+ train/ActionNoiseL2Loss=0.1526
+ throughput/total_tokens=1,734,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9037/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,735,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9038/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,735,296,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9039/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,735,488,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9040/500000]
+ optim/total_grad_norm=0.7141
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,735,680,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9041/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,735,872,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9042/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,736,064,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9043/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=1,736,256,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9044/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,736,448,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9045/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=1,736,640,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9046/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,736,832,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9047/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,737,024,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9048/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,737,216,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9049/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,737,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9050/500000]
+ train/ActionNoiseL2Loss=0.0962
+ throughput/total_tokens=1,737,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9051/500000]
+ train/ActionNoiseL2Loss=0.1438
+ throughput/total_tokens=1,737,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9052/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,737,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9053/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,738,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9054/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,738,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9055/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,738,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9056/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,738,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9057/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=1,738,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9058/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=1,739,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9059/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,739,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9060/500000]
+ optim/total_grad_norm=1.254
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,739,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9061/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=1,739,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9062/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,739,904,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9063/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=1,740,096,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9064/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,740,288,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9065/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,740,480,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9066/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=1,740,672,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9067/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=1,740,864,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9068/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,741,056,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9069/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=1,741,248,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9070/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,741,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9071/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,741,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9072/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,741,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9073/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,742,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9074/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,742,208,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9075/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,742,400,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9076/500000]
+ train/ActionNoiseL2Loss=0.0182
+ throughput/total_tokens=1,742,592,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9077/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=1,742,784,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9078/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,742,976,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9079/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,743,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9080/500000]
+ optim/total_grad_norm=0.8883
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,743,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9081/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=1,743,552,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9082/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,743,744,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9083/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=1,743,936,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9084/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,744,128,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9085/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=1,744,320,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9086/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,744,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9087/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,744,704,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9088/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,744,896,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9089/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,745,088,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9090/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=1,745,280,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9091/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,745,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9092/500000]
+ train/ActionNoiseL2Loss=0.1165
+ throughput/total_tokens=1,745,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9093/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,745,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9094/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,746,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9095/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,746,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9096/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,746,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9097/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,746,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9098/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,746,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9099/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=1,747,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9100/500000]
+ optim/total_grad_norm=0.7975
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,747,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9101/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,747,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9102/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,747,584,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9103/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,747,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9104/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,747,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9105/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,748,160,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9106/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,748,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9107/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,748,544,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9108/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,748,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9109/500000]
+ train/ActionNoiseL2Loss=0.0933
+ throughput/total_tokens=1,748,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9110/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,749,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9111/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=1,749,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9112/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,749,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9113/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,749,696,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9114/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,749,888,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9115/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,750,080,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9116/500000]
+ train/ActionNoiseL2Loss=0.0779
+ throughput/total_tokens=1,750,272,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9117/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,750,464,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9118/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,750,656,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9119/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,750,848,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9120/500000]
+ optim/total_grad_norm=0.8641
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=1,751,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9121/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,751,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9122/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,751,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9123/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,751,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9124/500000]
+ train/ActionNoiseL2Loss=0.0177
+ throughput/total_tokens=1,751,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9125/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,752,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9126/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=1,752,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9127/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=1,752,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9128/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,752,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9129/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,752,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9130/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,752,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9131/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,753,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9132/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,753,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9133/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=1,753,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9134/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,753,728,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9135/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,753,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9136/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,754,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9137/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,754,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9138/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=1,754,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9139/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,754,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9140/500000]
+ optim/total_grad_norm=0.9179
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,754,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9141/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=1,755,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9142/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=1,755,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9143/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,755,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9144/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,755,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9145/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=1,755,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9146/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=1,756,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9147/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,756,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9148/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,756,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9149/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,756,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9150/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=1,756,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9151/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,756,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9152/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,757,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9153/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,757,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9154/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,757,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9155/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=1,757,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9156/500000]
+ train/ActionNoiseL2Loss=0.0946
+ throughput/total_tokens=1,757,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9157/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=1,758,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9158/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=1,758,336,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9159/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,758,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9160/500000]
+ optim/total_grad_norm=1.210
+ train/ActionNoiseL2Loss=0.1049
+ throughput/total_tokens=1,758,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9161/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,758,912,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9162/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=1,759,104,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9163/500000]
+ train/ActionNoiseL2Loss=0.0823
+ throughput/total_tokens=1,759,296,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9164/500000]
+ train/ActionNoiseL2Loss=0.0916
+ throughput/total_tokens=1,759,488,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9165/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,759,680,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9166/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=1,759,872,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9167/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,760,064,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9168/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,760,256,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9169/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,760,448,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9170/500000]
+ train/ActionNoiseL2Loss=0.1134
+ throughput/total_tokens=1,760,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9171/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,760,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9172/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=1,761,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9173/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,761,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9174/500000]
+ train/ActionNoiseL2Loss=0.0273
+ throughput/total_tokens=1,761,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9175/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=1,761,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9176/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=1,761,792,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9177/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,761,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9178/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=1,762,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9179/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=1,762,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9180/500000]
+ optim/total_grad_norm=0.8130
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,762,560,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9181/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=1,762,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9182/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,762,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9183/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=1,763,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9184/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,763,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9185/500000]
+ train/ActionNoiseL2Loss=0.1056
+ throughput/total_tokens=1,763,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9186/500000]
+ train/ActionNoiseL2Loss=0.0288
+ throughput/total_tokens=1,763,712,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9187/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=1,763,904,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9188/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,764,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9189/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,764,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9190/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=1,764,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=9191/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,764,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9192/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=1,764,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9193/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=1,765,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9194/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=1,765,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9195/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,765,440,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9196/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,765,632,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9197/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,765,824,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9198/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,766,016,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9199/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,766,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9200/500000]
+ optim/total_grad_norm=1.121
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=1,766,400,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9201/500000]
+ train/ActionNoiseL2Loss=0.0954
+ throughput/total_tokens=1,766,592,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9202/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,766,784,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9203/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,766,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9204/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,767,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9205/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,767,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9206/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,767,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9207/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,767,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9208/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=1,767,936,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9209/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,768,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9210/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,768,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9211/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=1,768,512,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9212/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,768,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9213/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=1,768,896,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9214/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,769,088,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9215/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,769,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9216/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=1,769,472,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9217/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,769,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9218/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,769,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9219/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,770,048,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9220/500000]
+ optim/total_grad_norm=0.7407
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,770,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9221/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,770,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9222/500000]
+ train/ActionNoiseL2Loss=0.1042
+ throughput/total_tokens=1,770,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9223/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,770,816,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9224/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,771,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9225/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,771,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9226/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,771,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9227/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,771,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9228/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,771,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9229/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=1,771,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9230/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,772,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9231/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,772,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9232/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,772,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9233/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,772,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9234/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,772,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9235/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=1,773,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9236/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,773,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9237/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,773,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9238/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,773,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9239/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,773,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9240/500000]
+ optim/total_grad_norm=1.406
+ train/ActionNoiseL2Loss=0.0955
+ throughput/total_tokens=1,774,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9241/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=1,774,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9242/500000]
+ train/ActionNoiseL2Loss=0.1011
+ throughput/total_tokens=1,774,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9243/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=1,774,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9244/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,774,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9245/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,775,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9246/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,775,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9247/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=1,775,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9248/500000]
+ train/ActionNoiseL2Loss=0.0959
+ throughput/total_tokens=1,775,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9249/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,775,808,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9250/500000]
+ train/ActionNoiseL2Loss=0.1226
+ throughput/total_tokens=1,776,000,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=9251/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,776,192,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9252/500000]
+ train/ActionNoiseL2Loss=0.0757
+ throughput/total_tokens=1,776,384,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9253/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=1,776,576,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9254/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,776,768,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9255/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,776,960,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9256/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,777,152,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9257/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,777,344,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9258/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,777,536,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9259/500000]
+ train/ActionNoiseL2Loss=0.0819
+ throughput/total_tokens=1,777,728,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9260/500000]
+ optim/total_grad_norm=0.9794
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=1,777,920,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9261/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=1,778,112,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9262/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,778,304,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9263/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,778,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9264/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,778,688,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9265/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=1,778,880,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9266/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,779,072,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9267/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,779,264,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9268/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,779,456,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9269/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,779,648,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9270/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,779,840,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=9271/500000]
+ train/ActionNoiseL2Loss=0.1318
+ throughput/total_tokens=1,780,032,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9272/500000]
+ train/ActionNoiseL2Loss=0.0806
+ throughput/total_tokens=1,780,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9273/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,780,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9274/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,780,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9275/500000]
+ train/ActionNoiseL2Loss=0.1035
+ throughput/total_tokens=1,780,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9276/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=1,780,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9277/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=1,781,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9278/500000]
+ train/ActionNoiseL2Loss=0.0903
+ throughput/total_tokens=1,781,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9279/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,781,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9280/500000]
+ optim/total_grad_norm=0.5929
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,781,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9281/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,781,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9282/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=1,782,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9283/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=1,782,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9284/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,782,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9285/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,782,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9286/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,782,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9287/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,783,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9288/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=1,783,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9289/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,783,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9290/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,783,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9291/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,783,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9292/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,784,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9293/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,784,256,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9294/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=1,784,448,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9295/500000]
+ train/ActionNoiseL2Loss=0.0845
+ throughput/total_tokens=1,784,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9296/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,784,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9297/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,785,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9298/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,785,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9299/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=1,785,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9300/500000]
+ optim/total_grad_norm=0.7100
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,785,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9301/500000]
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=1,785,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9302/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,785,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9303/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,786,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9304/500000]
+ train/ActionNoiseL2Loss=0.0588
+ throughput/total_tokens=1,786,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9305/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=1,786,560,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9306/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=1,786,752,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9307/500000]
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=1,786,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9308/500000]
+ train/ActionNoiseL2Loss=0.0685
+ throughput/total_tokens=1,787,136,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9309/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,787,328,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9310/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,787,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9311/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,787,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9312/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,787,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9313/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,788,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9314/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,788,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9315/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,788,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9316/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,788,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9317/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=1,788,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9318/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,789,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9319/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=1,789,248,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9320/500000]
+ optim/total_grad_norm=0.9840
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=1,789,440,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9321/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=1,789,632,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9322/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,789,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9323/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=1,790,016,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9324/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=1,790,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9325/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,790,400,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9326/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,790,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9327/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,790,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9328/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,790,976,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9329/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,791,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9330/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,791,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9331/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=1,791,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9332/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,791,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9333/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,791,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9334/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,792,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9335/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=1,792,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9336/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=1,792,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9337/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,792,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9338/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,792,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9339/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,793,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9340/500000]
+ optim/total_grad_norm=1.175
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=1,793,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=9341/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,793,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9342/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=1,793,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9343/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,793,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9344/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,794,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9345/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,794,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9346/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,794,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9347/500000]
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,794,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9348/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=1,794,816,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9349/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,795,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9350/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,795,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9351/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,795,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9352/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=1,795,584,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9353/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,795,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9354/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,795,968,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9355/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,796,160,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9356/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,796,352,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9357/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=1,796,544,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9358/500000]
+ train/ActionNoiseL2Loss=0.0333
+ throughput/total_tokens=1,796,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9359/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,796,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9360/500000]
+ optim/total_grad_norm=0.8053
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,797,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9361/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=1,797,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9362/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,797,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9363/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,797,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9364/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,797,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9365/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=1,798,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9366/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=1,798,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9367/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,798,464,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9368/500000]
+ train/ActionNoiseL2Loss=0.1156
+ throughput/total_tokens=1,798,656,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9369/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=1,798,848,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9370/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=1,799,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9371/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,799,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9372/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,799,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9373/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,799,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9374/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=1,799,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9375/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=1,800,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9376/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=1,800,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9377/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,800,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9378/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,800,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9379/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,800,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9380/500000]
+ optim/total_grad_norm=1.021
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,800,960,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9381/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,801,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9382/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,801,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9383/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,801,536,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9384/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=1,801,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9385/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=1,801,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9386/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,802,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9387/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,802,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9388/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=1,802,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9389/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,802,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9390/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,802,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9391/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,803,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9392/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,803,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9393/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=1,803,456,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9394/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,803,648,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9395/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,803,840,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9396/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=1,804,032,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9397/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=1,804,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9398/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,804,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9399/500000]
+ train/ActionNoiseL2Loss=0.0297
+ throughput/total_tokens=1,804,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9400/500000]
+ optim/total_grad_norm=0.7205
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,804,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=9401/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,804,992,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9402/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=1,805,184,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9403/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,805,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9404/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,805,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9405/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,805,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9406/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=1,805,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9407/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=1,806,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9408/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=1,806,336,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9409/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,806,528,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9410/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=1,806,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9411/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,806,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9412/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,807,104,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9413/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=1,807,296,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9414/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,807,488,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9415/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,807,680,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9416/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,807,872,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9417/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,808,064,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9418/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=1,808,256,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9419/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,808,448,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9420/500000]
+ optim/total_grad_norm=0.6703
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,808,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9421/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,808,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9422/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,809,024,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9423/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,809,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9424/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,809,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9425/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,809,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9426/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=1,809,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9427/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,809,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9428/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,810,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9429/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=1,810,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9430/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=1,810,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=9431/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,810,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9432/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=1,810,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9433/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,811,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9434/500000]
+ train/ActionNoiseL2Loss=0.0909
+ throughput/total_tokens=1,811,328,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9435/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,811,520,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9436/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,811,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9437/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,811,904,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9438/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,812,096,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9439/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,812,288,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9440/500000]
+ optim/total_grad_norm=0.8681
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,812,480,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=9441/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,812,672,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9442/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,812,864,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9443/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,813,056,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9444/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=1,813,248,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9445/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,813,440,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9446/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=1,813,632,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9447/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,813,824,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9448/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,814,016,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+[step=9449/500000]
+ train/ActionNoiseL2Loss=0.1178
+ throughput/total_tokens=1,814,208,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9450/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,814,400,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=9451/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,814,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9452/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,814,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9453/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,814,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9454/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=1,815,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9455/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,815,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9456/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,815,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9457/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=1,815,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9458/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=1,815,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9459/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=1,816,128,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9460/500000]
+ optim/total_grad_norm=0.8907
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=1,816,320,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9461/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=1,816,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9462/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,816,704,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9463/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=1,816,896,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9464/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=1,817,088,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9465/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,817,280,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9466/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,817,472,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9467/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=1,817,664,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9468/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,817,856,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9469/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,818,048,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9470/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,818,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=9471/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,818,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9472/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,818,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9473/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,818,816,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9474/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,819,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9475/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=1,819,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9476/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,819,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9477/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,819,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9478/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,819,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9479/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,819,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9480/500000]
+ optim/total_grad_norm=0.8255
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=1,820,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9481/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,820,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9482/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,820,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9483/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=1,820,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9484/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,820,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9485/500000]
+ train/ActionNoiseL2Loss=0.0842
+ throughput/total_tokens=1,821,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9486/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=1,821,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9487/500000]
+ train/ActionNoiseL2Loss=0.0315
+ throughput/total_tokens=1,821,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9488/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,821,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9489/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=1,821,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9490/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,822,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9491/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=1,822,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9492/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,822,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9493/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,822,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9494/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,822,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9495/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,823,040,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9496/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=1,823,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9497/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,823,424,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9498/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,823,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9499/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=1,823,808,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9500/500000]
+ optim/total_grad_norm=0.8810
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=1,824,000,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+10/14 [01:12:58] INFO | >> Saving config... checkpoint.py:608
+10/14 [01:13:41] INFO | >> Saving model state... checkpoint.py:796
+10/14 [01:14:55] INFO | >> Saving optim state... checkpoint.py:811
+10/14 [01:16:31] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=9501/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,824,192,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=9502/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,824,384,000
+ throughput/device/tokens_per_second=1,130
+ throughput/device/batches_per_second=0.0471
+[step=9503/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,824,576,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=9504/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,824,768,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0474
+[step=9505/500000]
+ train/ActionNoiseL2Loss=0.0883
+ throughput/total_tokens=1,824,960,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=9506/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=1,825,152,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=9507/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=1,825,344,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=9508/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=1,825,536,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=9509/500000]
+ train/ActionNoiseL2Loss=0.1094
+ throughput/total_tokens=1,825,728,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=9510/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=1,825,920,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=9511/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,826,112,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9512/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,826,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9513/500000]
+ train/ActionNoiseL2Loss=0.0957
+ throughput/total_tokens=1,826,496,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9514/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,826,688,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9515/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,826,880,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9516/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,827,072,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9517/500000]
+ train/ActionNoiseL2Loss=0.0808
+ throughput/total_tokens=1,827,264,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9518/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,827,456,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9519/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,827,648,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9520/500000]
+ optim/total_grad_norm=0.7601
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,827,840,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9521/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,828,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9522/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,828,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9523/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,828,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9524/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=1,828,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9525/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=1,828,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9526/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,828,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9527/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,829,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9528/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,829,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9529/500000]
+ train/ActionNoiseL2Loss=0.1434
+ throughput/total_tokens=1,829,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9530/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=1,829,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9531/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,829,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9532/500000]
+ train/ActionNoiseL2Loss=0.0948
+ throughput/total_tokens=1,830,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9533/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=1,830,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9534/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=1,830,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9535/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=1,830,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9536/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=1,830,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9537/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,831,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9538/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,831,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9539/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,831,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9540/500000]
+ optim/total_grad_norm=0.6673
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=1,831,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=9541/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=1,831,872,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9542/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=1,832,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9543/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,832,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9544/500000]
+ train/ActionNoiseL2Loss=0.0892
+ throughput/total_tokens=1,832,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9545/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=1,832,640,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9546/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,832,832,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9547/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,833,024,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9548/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=1,833,216,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9549/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=1,833,408,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=9550/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=1,833,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=9551/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,833,792,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9552/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,833,984,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9553/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,834,176,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9554/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,834,368,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9555/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,834,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9556/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,834,752,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9557/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,834,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9558/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=1,835,136,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9559/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,835,328,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9560/500000]
+ optim/total_grad_norm=0.6995
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=1,835,520,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9561/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,835,712,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9562/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=1,835,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9563/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,836,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9564/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=1,836,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9565/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=1,836,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9566/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,836,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9567/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,836,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9568/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,837,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9569/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,837,248,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9570/500000]
+ train/ActionNoiseL2Loss=0.0340
+ throughput/total_tokens=1,837,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9571/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,837,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9572/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=1,837,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9573/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=1,838,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9574/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,838,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9575/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,838,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9576/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=1,838,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9577/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,838,784,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9578/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=1,838,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9579/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=1,839,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9580/500000]
+ optim/total_grad_norm=0.7208
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,839,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9581/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,839,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9582/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=1,839,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9583/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,839,936,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9584/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,840,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9585/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,840,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9586/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,840,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9587/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,840,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9588/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,840,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9589/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=1,841,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9590/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,841,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9591/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=1,841,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9592/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,841,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9593/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=1,841,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9594/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=1,842,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9595/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,842,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9596/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=1,842,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9597/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=1,842,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9598/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,842,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9599/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,843,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9600/500000]
+ optim/total_grad_norm=0.9291
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,843,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9601/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,843,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9602/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,843,584,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9603/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,843,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9604/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,843,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9605/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,844,160,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9606/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,844,352,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9607/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=1,844,544,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9608/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=1,844,736,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9609/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,844,928,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9610/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,845,120,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9611/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=1,845,312,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9612/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,845,504,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9613/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,845,696,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9614/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=1,845,888,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9615/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=1,846,080,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9616/500000]
+ train/ActionNoiseL2Loss=0.0876
+ throughput/total_tokens=1,846,272,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9617/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=1,846,464,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9618/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=1,846,656,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9619/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,846,848,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9620/500000]
+ optim/total_grad_norm=0.9504
+ train/ActionNoiseL2Loss=0.0302
+ throughput/total_tokens=1,847,040,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=9621/500000]
+ train/ActionNoiseL2Loss=0.0920
+ throughput/total_tokens=1,847,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9622/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,847,424,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9623/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,847,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9624/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=1,847,808,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9625/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=1,848,000,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9626/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,848,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9627/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,848,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9628/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=1,848,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9629/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=1,848,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9630/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,848,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9631/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,849,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9632/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=1,849,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9633/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,849,536,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9634/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,849,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9635/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=1,849,920,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9636/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,850,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9637/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,850,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9638/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=1,850,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9639/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,850,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9640/500000]
+ optim/total_grad_norm=1.178
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=1,850,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9641/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=1,851,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9642/500000]
+ train/ActionNoiseL2Loss=0.1087
+ throughput/total_tokens=1,851,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9643/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,851,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9644/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,851,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9645/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,851,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9646/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,852,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9647/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,852,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9648/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,852,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9649/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,852,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9650/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,852,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9651/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,852,992,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=9652/500000]
+ train/ActionNoiseL2Loss=0.0370
+ throughput/total_tokens=1,853,184,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=9653/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,853,376,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=9654/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=1,853,568,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9655/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=1,853,760,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9656/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,853,952,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9657/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=1,854,144,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9658/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=1,854,336,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9659/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=1,854,528,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=9660/500000]
+ optim/total_grad_norm=0.9535
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=1,854,720,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=9661/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=1,854,912,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9662/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,855,104,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9663/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=1,855,296,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=9664/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,855,488,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=9665/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=1,855,680,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=9666/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,855,872,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=9667/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,856,064,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=9668/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,856,256,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=9669/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=1,856,448,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=9670/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,856,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9671/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,856,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9672/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=1,857,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9673/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,857,216,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9674/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=1,857,408,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9675/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,857,600,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9676/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,857,792,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9677/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=1,857,984,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9678/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,858,176,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9679/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,858,368,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9680/500000]
+ optim/total_grad_norm=0.8665
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,858,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9681/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,858,752,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9682/500000]
+ train/ActionNoiseL2Loss=0.1070
+ throughput/total_tokens=1,858,944,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9683/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=1,859,136,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9684/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,859,328,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9685/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=1,859,520,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9686/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,859,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9687/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=1,859,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9688/500000]
+ train/ActionNoiseL2Loss=0.0977
+ throughput/total_tokens=1,860,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9689/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,860,288,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9690/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,860,480,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9691/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,860,672,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9692/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,860,864,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9693/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=1,861,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9694/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,861,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9695/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,861,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9696/500000]
+ train/ActionNoiseL2Loss=0.0718
+ throughput/total_tokens=1,861,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9697/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=1,861,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9698/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,862,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9699/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=1,862,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9700/500000]
+ optim/total_grad_norm=1.217
+ train/ActionNoiseL2Loss=0.1158
+ throughput/total_tokens=1,862,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9701/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,862,592,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9702/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,862,784,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9703/500000]
+ train/ActionNoiseL2Loss=0.0735
+ throughput/total_tokens=1,862,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9704/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,863,168,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9705/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,863,360,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9706/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=1,863,552,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9707/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,863,744,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9708/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,863,936,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9709/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,864,128,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9710/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=1,864,320,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9711/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,864,512,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9712/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=1,864,704,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9713/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,864,896,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9714/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,865,088,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9715/500000]
+ train/ActionNoiseL2Loss=0.0877
+ throughput/total_tokens=1,865,280,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9716/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,865,472,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9717/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,865,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9718/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,865,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9719/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=1,866,048,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9720/500000]
+ optim/total_grad_norm=0.6814
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,866,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9721/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,866,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9722/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=1,866,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9723/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,866,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9724/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=1,867,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9725/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,867,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9726/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,867,392,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9727/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,867,584,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9728/500000]
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=1,867,776,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9729/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=1,867,968,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9730/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=1,868,160,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9731/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,868,352,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9732/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,868,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9733/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,868,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9734/500000]
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=1,868,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9735/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,869,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9736/500000]
+ train/ActionNoiseL2Loss=0.1031
+ throughput/total_tokens=1,869,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9737/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,869,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9738/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=1,869,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9739/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=1,869,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9740/500000]
+ optim/total_grad_norm=0.7325
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,870,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9741/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,870,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9742/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=1,870,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9743/500000]
+ train/ActionNoiseL2Loss=0.0800
+ throughput/total_tokens=1,870,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9744/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=1,870,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9745/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=1,871,040,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9746/500000]
+ train/ActionNoiseL2Loss=0.1052
+ throughput/total_tokens=1,871,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9747/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,871,424,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9748/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,871,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9749/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,871,808,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9750/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=1,872,000,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=9751/500000]
+ train/ActionNoiseL2Loss=0.0987
+ throughput/total_tokens=1,872,192,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9752/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,872,384,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9753/500000]
+ train/ActionNoiseL2Loss=0.1280
+ throughput/total_tokens=1,872,576,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9754/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,872,768,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9755/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=1,872,960,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9756/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,873,152,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9757/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,873,344,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9758/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=1,873,536,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9759/500000]
+ train/ActionNoiseL2Loss=0.0339
+ throughput/total_tokens=1,873,728,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9760/500000]
+ optim/total_grad_norm=1.054
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=1,873,920,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9761/500000]
+ train/ActionNoiseL2Loss=0.0768
+ throughput/total_tokens=1,874,112,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9762/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,874,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9763/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=1,874,496,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9764/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=1,874,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9765/500000]
+ train/ActionNoiseL2Loss=0.1002
+ throughput/total_tokens=1,874,880,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9766/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,875,072,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9767/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,875,264,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9768/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,875,456,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9769/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=1,875,648,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9770/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,875,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9771/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,876,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9772/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,876,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9773/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,876,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9774/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,876,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9775/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=1,876,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9776/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,876,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9777/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=1,877,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9778/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=1,877,376,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9779/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,877,568,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9780/500000]
+ optim/total_grad_norm=0.5643
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,877,760,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9781/500000]
+ train/ActionNoiseL2Loss=0.0295
+ throughput/total_tokens=1,877,952,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9782/500000]
+ train/ActionNoiseL2Loss=0.1330
+ throughput/total_tokens=1,878,144,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9783/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,878,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9784/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=1,878,528,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9785/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=1,878,720,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9786/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=1,878,912,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9787/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,879,104,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9788/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,879,296,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9789/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,879,488,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9790/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,879,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9791/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,879,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9792/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,880,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9793/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,880,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9794/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=1,880,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9795/500000]
+ train/ActionNoiseL2Loss=0.0810
+ throughput/total_tokens=1,880,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9796/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,880,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9797/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,881,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9798/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=1,881,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9799/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=1,881,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9800/500000]
+ optim/total_grad_norm=0.6055
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=1,881,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9801/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=1,881,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9802/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=1,881,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9803/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=1,882,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9804/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=1,882,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9805/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,882,560,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9806/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,882,752,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9807/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,882,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9808/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=1,883,136,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9809/500000]
+ train/ActionNoiseL2Loss=0.0186
+ throughput/total_tokens=1,883,328,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9810/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,883,520,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=9811/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=1,883,712,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9812/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,883,904,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9813/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=1,884,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9814/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=1,884,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9815/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=1,884,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9816/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,884,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9817/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=1,884,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9818/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,885,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9819/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=1,885,248,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9820/500000]
+ optim/total_grad_norm=0.6123
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,885,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9821/500000]
+ train/ActionNoiseL2Loss=0.0835
+ throughput/total_tokens=1,885,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9822/500000]
+ train/ActionNoiseL2Loss=0.1401
+ throughput/total_tokens=1,885,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9823/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,886,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9824/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=1,886,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9825/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,886,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9826/500000]
+ train/ActionNoiseL2Loss=0.1044
+ throughput/total_tokens=1,886,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9827/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,886,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9828/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,886,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9829/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=1,887,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9830/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=1,887,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9831/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,887,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9832/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,887,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9833/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,887,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9834/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=1,888,128,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9835/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,888,320,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9836/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,888,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9837/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,888,704,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9838/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,888,896,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9839/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=1,889,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9840/500000]
+ optim/total_grad_norm=0.9200
+ train/ActionNoiseL2Loss=0.1080
+ throughput/total_tokens=1,889,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9841/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=1,889,472,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9842/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,889,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9843/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,889,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9844/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=1,890,048,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9845/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,890,240,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9846/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,890,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9847/500000]
+ train/ActionNoiseL2Loss=0.0889
+ throughput/total_tokens=1,890,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9848/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=1,890,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9849/500000]
+ train/ActionNoiseL2Loss=0.1043
+ throughput/total_tokens=1,891,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9850/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=1,891,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9851/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,891,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9852/500000]
+ train/ActionNoiseL2Loss=0.0825
+ throughput/total_tokens=1,891,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9853/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=1,891,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9854/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,891,968,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9855/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,892,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9856/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=1,892,352,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9857/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,892,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9858/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,892,736,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9859/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,892,928,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9860/500000]
+ optim/total_grad_norm=0.7429
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=1,893,120,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=9861/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,893,312,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9862/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,893,504,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9863/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=1,893,696,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9864/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,893,888,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9865/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,894,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9866/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,894,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9867/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=1,894,464,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9868/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,894,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9869/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,894,848,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9870/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,895,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9871/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=1,895,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9872/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=1,895,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9873/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,895,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9874/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=1,895,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9875/500000]
+ train/ActionNoiseL2Loss=0.1163
+ throughput/total_tokens=1,896,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9876/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,896,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9877/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,896,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9878/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,896,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9879/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=1,896,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9880/500000]
+ optim/total_grad_norm=0.5717
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,896,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9881/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,897,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9882/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,897,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9883/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=1,897,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9884/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,897,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9885/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=1,897,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9886/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=1,898,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9887/500000]
+ train/ActionNoiseL2Loss=0.0237
+ throughput/total_tokens=1,898,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9888/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,898,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9889/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,898,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9890/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=1,898,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9891/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=1,899,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9892/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,899,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9893/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,899,456,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9894/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=1,899,648,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9895/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,899,840,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9896/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,900,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9897/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,900,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9898/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=1,900,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9899/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=1,900,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9900/500000]
+ optim/total_grad_norm=0.6388
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,900,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=9901/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,900,992,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9902/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=1,901,184,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9903/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,901,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9904/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=1,901,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9905/500000]
+ train/ActionNoiseL2Loss=0.0185
+ throughput/total_tokens=1,901,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9906/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,901,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9907/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=1,902,144,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9908/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=1,902,336,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9909/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,902,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9910/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=1,902,720,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9911/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,902,912,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9912/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,903,104,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9913/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=1,903,296,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9914/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,903,488,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=9915/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,903,680,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9916/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=1,903,872,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9917/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=1,904,064,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9918/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,904,256,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=9919/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=1,904,448,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=9920/500000]
+ optim/total_grad_norm=0.4102
+ train/ActionNoiseL2Loss=0.0386
+ throughput/total_tokens=1,904,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9921/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=1,904,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9922/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=1,905,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9923/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,905,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9924/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=1,905,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9925/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=1,905,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9926/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,905,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9927/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=1,905,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9928/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=1,906,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9929/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=1,906,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9930/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,906,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9931/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=1,906,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9932/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=1,906,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9933/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=1,907,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9934/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,907,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9935/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,907,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9936/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,907,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9937/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=1,907,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9938/500000]
+ train/ActionNoiseL2Loss=0.0184
+ throughput/total_tokens=1,908,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9939/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,908,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9940/500000]
+ optim/total_grad_norm=1.313
+ train/ActionNoiseL2Loss=0.0777
+ throughput/total_tokens=1,908,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9941/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,908,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9942/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,908,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9943/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,909,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9944/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,909,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9945/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=1,909,440,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9946/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=1,909,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9947/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,909,824,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9948/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=1,910,016,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9949/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=1,910,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9950/500000]
+ train/ActionNoiseL2Loss=0.0263
+ throughput/total_tokens=1,910,400,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=9951/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=1,910,592,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9952/500000]
+ train/ActionNoiseL2Loss=0.0458
+ throughput/total_tokens=1,910,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9953/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=1,910,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9954/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,911,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9955/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=1,911,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9956/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=1,911,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9957/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=1,911,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9958/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=1,911,936,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9959/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=1,912,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9960/500000]
+ optim/total_grad_norm=0.7172
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=1,912,320,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=9961/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,912,512,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9962/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,912,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9963/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=1,912,896,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9964/500000]
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=1,913,088,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9965/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=1,913,280,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9966/500000]
+ train/ActionNoiseL2Loss=0.1077
+ throughput/total_tokens=1,913,472,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9967/500000]
+ train/ActionNoiseL2Loss=0.0834
+ throughput/total_tokens=1,913,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9968/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=1,913,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9969/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,914,048,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=9970/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,914,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9971/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=1,914,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=9972/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=1,914,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9973/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=1,914,816,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9974/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=1,915,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9975/500000]
+ train/ActionNoiseL2Loss=0.1322
+ throughput/total_tokens=1,915,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9976/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=1,915,392,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9977/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=1,915,584,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9978/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,915,776,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=9979/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=1,915,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9980/500000]
+ optim/total_grad_norm=0.7468
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,916,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9981/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,916,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9982/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,916,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9983/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,916,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=9984/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,916,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9985/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=1,917,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9986/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=1,917,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9987/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,917,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9988/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=1,917,696,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9989/500000]
+ train/ActionNoiseL2Loss=0.0257
+ throughput/total_tokens=1,917,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9990/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=1,918,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=9991/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,918,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9992/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,918,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=9993/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,918,656,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=9994/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=1,918,848,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9995/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=1,919,040,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9996/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=1,919,232,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9997/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,919,424,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9998/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=1,919,616,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=9999/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=1,919,808,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10000/500000]
+ optim/total_grad_norm=1.084
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=1,920,000,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+10/14 [04:11:41] INFO | >> Saving config... checkpoint.py:608
+10/14 [04:12:32] INFO | >> Saving model state... checkpoint.py:796
+10/14 [04:13:40] INFO | >> Saving optim state... checkpoint.py:811
+10/14 [04:15:15] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=10001/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,920,192,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0471
+[step=10002/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=1,920,384,000
+ throughput/device/tokens_per_second=1,140
+ throughput/device/batches_per_second=0.0475
+[step=10003/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,920,576,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=10004/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=1,920,768,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=10005/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,920,960,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10006/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,921,152,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10007/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=1,921,344,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10008/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=1,921,536,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10009/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=1,921,728,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10010/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=1,921,920,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10011/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=1,922,112,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10012/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=1,922,304,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10013/500000]
+ train/ActionNoiseL2Loss=0.0443
+ throughput/total_tokens=1,922,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10014/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=1,922,688,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10015/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,922,880,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10016/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,923,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10017/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=1,923,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10018/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=1,923,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10019/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,923,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10020/500000]
+ optim/total_grad_norm=0.8550
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=1,923,840,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10021/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=1,924,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10022/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,924,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10023/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=1,924,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10024/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=1,924,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10025/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,924,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10026/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,924,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10027/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,925,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10028/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,925,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10029/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=1,925,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10030/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=1,925,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10031/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=1,925,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10032/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=1,926,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10033/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,926,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10034/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=1,926,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10035/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,926,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10036/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,926,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10037/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=1,927,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10038/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=1,927,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10039/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=1,927,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10040/500000]
+ optim/total_grad_norm=0.7722
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,927,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10041/500000]
+ train/ActionNoiseL2Loss=0.0234
+ throughput/total_tokens=1,927,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10042/500000]
+ train/ActionNoiseL2Loss=0.1312
+ throughput/total_tokens=1,928,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10043/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=1,928,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10044/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=1,928,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10045/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,928,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10046/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=1,928,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10047/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=1,929,024,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10048/500000]
+ train/ActionNoiseL2Loss=0.0895
+ throughput/total_tokens=1,929,216,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10049/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=1,929,408,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10050/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,929,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=10051/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=1,929,792,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10052/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=1,929,984,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10053/500000]
+ train/ActionNoiseL2Loss=0.0772
+ throughput/total_tokens=1,930,176,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10054/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,930,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10055/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=1,930,560,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10056/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,930,752,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10057/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,930,944,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10058/500000]
+ train/ActionNoiseL2Loss=0.0224
+ throughput/total_tokens=1,931,136,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10059/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=1,931,328,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10060/500000]
+ optim/total_grad_norm=0.5317
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=1,931,520,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=10061/500000]
+ train/ActionNoiseL2Loss=0.1807
+ throughput/total_tokens=1,931,712,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10062/500000]
+ train/ActionNoiseL2Loss=0.0307
+ throughput/total_tokens=1,931,904,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10063/500000]
+ train/ActionNoiseL2Loss=0.0885
+ throughput/total_tokens=1,932,096,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10064/500000]
+ train/ActionNoiseL2Loss=0.0331
+ throughput/total_tokens=1,932,288,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=10065/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,932,480,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=10066/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=1,932,672,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10067/500000]
+ train/ActionNoiseL2Loss=0.0884
+ throughput/total_tokens=1,932,864,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10068/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,933,056,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10069/500000]
+ train/ActionNoiseL2Loss=0.1362
+ throughput/total_tokens=1,933,248,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10070/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,933,440,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10071/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,933,632,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10072/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=1,933,824,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10073/500000]
+ train/ActionNoiseL2Loss=0.0308
+ throughput/total_tokens=1,934,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10074/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,934,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10075/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=1,934,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10076/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,934,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10077/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,934,784,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10078/500000]
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=1,934,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10079/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=1,935,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10080/500000]
+ optim/total_grad_norm=1.041
+ train/ActionNoiseL2Loss=0.0760
+ throughput/total_tokens=1,935,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10081/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,935,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10082/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=1,935,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10083/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,935,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10084/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,936,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10085/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,936,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10086/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=1,936,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10087/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=1,936,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10088/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=1,936,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10089/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=1,937,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10090/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=1,937,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10091/500000]
+ train/ActionNoiseL2Loss=0.0958
+ throughput/total_tokens=1,937,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10092/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,937,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10093/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,937,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10094/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,938,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10095/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=1,938,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10096/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=1,938,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10097/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,938,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10098/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=1,938,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10099/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=1,939,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10100/500000]
+ optim/total_grad_norm=0.6376
+ train/ActionNoiseL2Loss=0.0328
+ throughput/total_tokens=1,939,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10101/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=1,939,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10102/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,939,584,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10103/500000]
+ train/ActionNoiseL2Loss=0.0656
+ throughput/total_tokens=1,939,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10104/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,939,968,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10105/500000]
+ train/ActionNoiseL2Loss=0.0255
+ throughput/total_tokens=1,940,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10106/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=1,940,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10107/500000]
+ train/ActionNoiseL2Loss=0.0886
+ throughput/total_tokens=1,940,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10108/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=1,940,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10109/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=1,940,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10110/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,941,120,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=10111/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,941,312,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10112/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,941,504,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10113/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,941,696,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10114/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=1,941,888,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10115/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=1,942,080,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10116/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=1,942,272,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10117/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=1,942,464,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10118/500000]
+ train/ActionNoiseL2Loss=0.0243
+ throughput/total_tokens=1,942,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10119/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=1,942,848,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10120/500000]
+ optim/total_grad_norm=1.279
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=1,943,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10121/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=1,943,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10122/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,943,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10123/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=1,943,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10124/500000]
+ train/ActionNoiseL2Loss=0.1065
+ throughput/total_tokens=1,943,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10125/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=1,944,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10126/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,944,192,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10127/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=1,944,384,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10128/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,944,576,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10129/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=1,944,768,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10130/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=1,944,960,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10131/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=1,945,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10132/500000]
+ train/ActionNoiseL2Loss=0.0698
+ throughput/total_tokens=1,945,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10133/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=1,945,536,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10134/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=1,945,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10135/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,945,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10136/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=1,946,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10137/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=1,946,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10138/500000]
+ train/ActionNoiseL2Loss=0.0654
+ throughput/total_tokens=1,946,496,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10139/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=1,946,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10140/500000]
+ optim/total_grad_norm=0.8540
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,946,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10141/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,947,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10142/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,947,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10143/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,947,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10144/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=1,947,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10145/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=1,947,840,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10146/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=1,948,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10147/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=1,948,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10148/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=1,948,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10149/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=1,948,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10150/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=1,948,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10151/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=1,948,992,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10152/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=1,949,184,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10153/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=1,949,376,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10154/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=1,949,568,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10155/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,949,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10156/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=1,949,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10157/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,950,144,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10158/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,950,336,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10159/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=1,950,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10160/500000]
+ optim/total_grad_norm=0.5886
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=1,950,720,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10161/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=1,950,912,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10162/500000]
+ train/ActionNoiseL2Loss=0.1110
+ throughput/total_tokens=1,951,104,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10163/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=1,951,296,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10164/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=1,951,488,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10165/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,951,680,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10166/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=1,951,872,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10167/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=1,952,064,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10168/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,952,256,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10169/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=1,952,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10170/500000]
+ train/ActionNoiseL2Loss=0.0915
+ throughput/total_tokens=1,952,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10171/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=1,952,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10172/500000]
+ train/ActionNoiseL2Loss=0.0908
+ throughput/total_tokens=1,953,024,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10173/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,953,216,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10174/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=1,953,408,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10175/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=1,953,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10176/500000]
+ train/ActionNoiseL2Loss=0.0944
+ throughput/total_tokens=1,953,792,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10177/500000]
+ train/ActionNoiseL2Loss=0.1137
+ throughput/total_tokens=1,953,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10178/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=1,954,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10179/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=1,954,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10180/500000]
+ optim/total_grad_norm=0.8266
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=1,954,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10181/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=1,954,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10182/500000]
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=1,954,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10183/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=1,955,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10184/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=1,955,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10185/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=1,955,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10186/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=1,955,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10187/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=1,955,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10188/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=1,956,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10189/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,956,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10190/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=1,956,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=10191/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=1,956,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10192/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=1,956,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10193/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,957,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10194/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=1,957,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10195/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=1,957,440,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10196/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=1,957,632,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10197/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=1,957,824,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10198/500000]
+ train/ActionNoiseL2Loss=0.0928
+ throughput/total_tokens=1,958,016,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10199/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,958,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10200/500000]
+ optim/total_grad_norm=0.8006
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,958,400,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=10201/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=1,958,592,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10202/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=1,958,784,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10203/500000]
+ train/ActionNoiseL2Loss=0.0165
+ throughput/total_tokens=1,958,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10204/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,959,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10205/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=1,959,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10206/500000]
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=1,959,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10207/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,959,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10208/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=1,959,936,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10209/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,960,128,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10210/500000]
+ train/ActionNoiseL2Loss=0.0776
+ throughput/total_tokens=1,960,320,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10211/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=1,960,512,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10212/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,960,704,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10213/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=1,960,896,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10214/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,961,088,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10215/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=1,961,280,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10216/500000]
+ train/ActionNoiseL2Loss=0.0988
+ throughput/total_tokens=1,961,472,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10217/500000]
+ train/ActionNoiseL2Loss=0.0282
+ throughput/total_tokens=1,961,664,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10218/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=1,961,856,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10219/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,962,048,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10220/500000]
+ optim/total_grad_norm=0.7721
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=1,962,240,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10221/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=1,962,432,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10222/500000]
+ train/ActionNoiseL2Loss=0.1151
+ throughput/total_tokens=1,962,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10223/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=1,962,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10224/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,963,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10225/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=1,963,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10226/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=1,963,392,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10227/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=1,963,584,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10228/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,963,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10229/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,963,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10230/500000]
+ train/ActionNoiseL2Loss=0.0866
+ throughput/total_tokens=1,964,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10231/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=1,964,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10232/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=1,964,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10233/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=1,964,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10234/500000]
+ train/ActionNoiseL2Loss=0.0512
+ throughput/total_tokens=1,964,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10235/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=1,965,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10236/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,965,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10237/500000]
+ train/ActionNoiseL2Loss=0.0979
+ throughput/total_tokens=1,965,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10238/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=1,965,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10239/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=1,965,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10240/500000]
+ optim/total_grad_norm=0.6304
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,966,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=10241/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=1,966,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10242/500000]
+ train/ActionNoiseL2Loss=0.0717
+ throughput/total_tokens=1,966,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10243/500000]
+ train/ActionNoiseL2Loss=0.1041
+ throughput/total_tokens=1,966,656,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10244/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=1,966,848,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10245/500000]
+ train/ActionNoiseL2Loss=0.0854
+ throughput/total_tokens=1,967,040,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10246/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,967,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10247/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,967,424,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10248/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,967,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10249/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=1,967,808,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10250/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=1,968,000,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=10251/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=1,968,192,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10252/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=1,968,384,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10253/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=1,968,576,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10254/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=1,968,768,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10255/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,968,960,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10256/500000]
+ train/ActionNoiseL2Loss=0.0449
+ throughput/total_tokens=1,969,152,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10257/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=1,969,344,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10258/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=1,969,536,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10259/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,969,728,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10260/500000]
+ optim/total_grad_norm=0.5086
+ train/ActionNoiseL2Loss=0.0216
+ throughput/total_tokens=1,969,920,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10261/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,970,112,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10262/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=1,970,304,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10263/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=1,970,496,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10264/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=1,970,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10265/500000]
+ train/ActionNoiseL2Loss=0.1096
+ throughput/total_tokens=1,970,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10266/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,971,072,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10267/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=1,971,264,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10268/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=1,971,456,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10269/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=1,971,648,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10270/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=1,971,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10271/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=1,972,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10272/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=1,972,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10273/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=1,972,416,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10274/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=1,972,608,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10275/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=1,972,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10276/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=1,972,992,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10277/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=1,973,184,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10278/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=1,973,376,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10279/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,973,568,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10280/500000]
+ optim/total_grad_norm=0.4467
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=1,973,760,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10281/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=1,973,952,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10282/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=1,974,144,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10283/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=1,974,336,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10284/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=1,974,528,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10285/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=1,974,720,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10286/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=1,974,912,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10287/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=1,975,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10288/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=1,975,296,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10289/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,975,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10290/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=1,975,680,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10291/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=1,975,872,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10292/500000]
+ train/ActionNoiseL2Loss=0.0964
+ throughput/total_tokens=1,976,064,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10293/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,976,256,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10294/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=1,976,448,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10295/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=1,976,640,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10296/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=1,976,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10297/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=1,977,024,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10298/500000]
+ train/ActionNoiseL2Loss=0.0369
+ throughput/total_tokens=1,977,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10299/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,977,408,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10300/500000]
+ optim/total_grad_norm=0.7108
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=1,977,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10301/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=1,977,792,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10302/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=1,977,984,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10303/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=1,978,176,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10304/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=1,978,368,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10305/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=1,978,560,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10306/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=1,978,752,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10307/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=1,978,944,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10308/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=1,979,136,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10309/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=1,979,328,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10310/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=1,979,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10311/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=1,979,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10312/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=1,979,904,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10313/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=1,980,096,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10314/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=1,980,288,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10315/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=1,980,480,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10316/500000]
+ train/ActionNoiseL2Loss=0.0609
+ throughput/total_tokens=1,980,672,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10317/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,980,864,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10318/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=1,981,056,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10319/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=1,981,248,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10320/500000]
+ optim/total_grad_norm=0.9065
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=1,981,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10321/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=1,981,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10322/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=1,981,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10323/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=1,982,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10324/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=1,982,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10325/500000]
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=1,982,400,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10326/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=1,982,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10327/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=1,982,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10328/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=1,982,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10329/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=1,983,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10330/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=1,983,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=10331/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=1,983,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10332/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,983,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10333/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=1,983,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10334/500000]
+ train/ActionNoiseL2Loss=0.0951
+ throughput/total_tokens=1,984,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10335/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=1,984,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10336/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=1,984,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10337/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=1,984,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10338/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=1,984,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10339/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=1,985,088,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10340/500000]
+ optim/total_grad_norm=0.6938
+ train/ActionNoiseL2Loss=0.0318
+ throughput/total_tokens=1,985,280,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=10341/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=1,985,472,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10342/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=1,985,664,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10343/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=1,985,856,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10344/500000]
+ train/ActionNoiseL2Loss=0.0414
+ throughput/total_tokens=1,986,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10345/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=1,986,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10346/500000]
+ train/ActionNoiseL2Loss=0.0232
+ throughput/total_tokens=1,986,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10347/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=1,986,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10348/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=1,986,816,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10349/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=1,987,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10350/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=1,987,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10351/500000]
+ train/ActionNoiseL2Loss=0.0850
+ throughput/total_tokens=1,987,392,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10352/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,987,584,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10353/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=1,987,776,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10354/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=1,987,968,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10355/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=1,988,160,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10356/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=1,988,352,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10357/500000]
+ train/ActionNoiseL2Loss=0.0705
+ throughput/total_tokens=1,988,544,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10358/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=1,988,736,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10359/500000]
+ train/ActionNoiseL2Loss=0.0981
+ throughput/total_tokens=1,988,928,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10360/500000]
+ optim/total_grad_norm=0.8478
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=1,989,120,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10361/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=1,989,312,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10362/500000]
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=1,989,504,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10363/500000]
+ train/ActionNoiseL2Loss=0.1078
+ throughput/total_tokens=1,989,696,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10364/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=1,989,888,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10365/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=1,990,080,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10366/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=1,990,272,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10367/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=1,990,464,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10368/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=1,990,656,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10369/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=1,990,848,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10370/500000]
+ train/ActionNoiseL2Loss=0.0868
+ throughput/total_tokens=1,991,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10371/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=1,991,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10372/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=1,991,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10373/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=1,991,616,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10374/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,991,808,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10375/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=1,992,000,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10376/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=1,992,192,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10377/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=1,992,384,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10378/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=1,992,576,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10379/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=1,992,768,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10380/500000]
+ optim/total_grad_norm=0.7922
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=1,992,960,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10381/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,993,152,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10382/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=1,993,344,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10383/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=1,993,536,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10384/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=1,993,728,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10385/500000]
+ train/ActionNoiseL2Loss=0.0727
+ throughput/total_tokens=1,993,920,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10386/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=1,994,112,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10387/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=1,994,304,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10388/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=1,994,496,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10389/500000]
+ train/ActionNoiseL2Loss=0.0488
+ throughput/total_tokens=1,994,688,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10390/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=1,994,880,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10391/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=1,995,072,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10392/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=1,995,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10393/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=1,995,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10394/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=1,995,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10395/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=1,995,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10396/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=1,996,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10397/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=1,996,224,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10398/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=1,996,416,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10399/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=1,996,608,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10400/500000]
+ optim/total_grad_norm=0.7413
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=1,996,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10401/500000]
+ train/ActionNoiseL2Loss=0.0799
+ throughput/total_tokens=1,996,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10402/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=1,997,184,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10403/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=1,997,376,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10404/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=1,997,568,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10405/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=1,997,760,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10406/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=1,997,952,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10407/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=1,998,144,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10408/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=1,998,336,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10409/500000]
+ train/ActionNoiseL2Loss=0.0844
+ throughput/total_tokens=1,998,528,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10410/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=1,998,720,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=10411/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=1,998,912,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10412/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=1,999,104,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10413/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=1,999,296,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10414/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=1,999,488,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10415/500000]
+ train/ActionNoiseL2Loss=0.1075
+ throughput/total_tokens=1,999,680,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10416/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=1,999,872,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10417/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=2,000,064,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10418/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=2,000,256,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10419/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=2,000,448,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10420/500000]
+ optim/total_grad_norm=0.7811
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=2,000,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10421/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=2,000,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10422/500000]
+ train/ActionNoiseL2Loss=0.0899
+ throughput/total_tokens=2,001,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10423/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=2,001,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10424/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=2,001,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10425/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=2,001,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10426/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=2,001,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10427/500000]
+ train/ActionNoiseL2Loss=0.0684
+ throughput/total_tokens=2,001,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10428/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=2,002,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10429/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=2,002,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10430/500000]
+ train/ActionNoiseL2Loss=0.0887
+ throughput/total_tokens=2,002,560,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10431/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=2,002,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10432/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=2,002,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10433/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=2,003,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10434/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=2,003,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10435/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=2,003,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10436/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=2,003,712,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10437/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=2,003,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10438/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=2,004,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10439/500000]
+ train/ActionNoiseL2Loss=0.0993
+ throughput/total_tokens=2,004,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10440/500000]
+ optim/total_grad_norm=1.067
+ train/ActionNoiseL2Loss=0.0583
+ throughput/total_tokens=2,004,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10441/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=2,004,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10442/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=2,004,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10443/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=2,005,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10444/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=2,005,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10445/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=2,005,440,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10446/500000]
+ train/ActionNoiseL2Loss=0.0875
+ throughput/total_tokens=2,005,632,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10447/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=2,005,824,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10448/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=2,006,016,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10449/500000]
+ train/ActionNoiseL2Loss=0.0252
+ throughput/total_tokens=2,006,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10450/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=2,006,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10451/500000]
+ train/ActionNoiseL2Loss=0.1302
+ throughput/total_tokens=2,006,592,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10452/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=2,006,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10453/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=2,006,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10454/500000]
+ train/ActionNoiseL2Loss=0.0796
+ throughput/total_tokens=2,007,168,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10455/500000]
+ train/ActionNoiseL2Loss=0.0956
+ throughput/total_tokens=2,007,360,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10456/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=2,007,552,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10457/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=2,007,744,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10458/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=2,007,936,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10459/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=2,008,128,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10460/500000]
+ optim/total_grad_norm=1.255
+ train/ActionNoiseL2Loss=0.1099
+ throughput/total_tokens=2,008,320,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10461/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=2,008,512,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10462/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=2,008,704,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10463/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=2,008,896,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10464/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=2,009,088,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10465/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=2,009,280,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10466/500000]
+ train/ActionNoiseL2Loss=0.0747
+ throughput/total_tokens=2,009,472,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10467/500000]
+ train/ActionNoiseL2Loss=0.0804
+ throughput/total_tokens=2,009,664,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=10468/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=2,009,856,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10469/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=2,010,048,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10470/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=2,010,240,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10471/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=2,010,432,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10472/500000]
+ train/ActionNoiseL2Loss=0.0984
+ throughput/total_tokens=2,010,624,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10473/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=2,010,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10474/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=2,011,008,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10475/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=2,011,200,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10476/500000]
+ train/ActionNoiseL2Loss=0.1243
+ throughput/total_tokens=2,011,392,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10477/500000]
+ train/ActionNoiseL2Loss=0.0694
+ throughput/total_tokens=2,011,584,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10478/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=2,011,776,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10479/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=2,011,968,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10480/500000]
+ optim/total_grad_norm=0.6595
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=2,012,160,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10481/500000]
+ train/ActionNoiseL2Loss=0.0733
+ throughput/total_tokens=2,012,352,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10482/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=2,012,544,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10483/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=2,012,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10484/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=2,012,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10485/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=2,013,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10486/500000]
+ train/ActionNoiseL2Loss=0.0697
+ throughput/total_tokens=2,013,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10487/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=2,013,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10488/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=2,013,696,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10489/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=2,013,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10490/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=2,014,080,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10491/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=2,014,272,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10492/500000]
+ train/ActionNoiseL2Loss=0.1067
+ throughput/total_tokens=2,014,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10493/500000]
+ train/ActionNoiseL2Loss=0.1279
+ throughput/total_tokens=2,014,656,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10494/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=2,014,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10495/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=2,015,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10496/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=2,015,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10497/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=2,015,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10498/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=2,015,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10499/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=2,015,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10500/500000]
+ optim/total_grad_norm=0.6505
+ train/ActionNoiseL2Loss=0.0952
+ throughput/total_tokens=2,016,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+10/14 [07:10:30] INFO | >> Saving config... checkpoint.py:608
+10/14 [07:11:03] INFO | >> Saving model state... checkpoint.py:796
+10/14 [07:12:14] INFO | >> Saving optim state... checkpoint.py:811
+10/14 [07:13:45] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=10501/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=2,016,192,000
+ throughput/device/tokens_per_second=1,128
+ throughput/device/batches_per_second=0.0470
+[step=10502/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=2,016,384,000
+ throughput/device/tokens_per_second=1,138
+ throughput/device/batches_per_second=0.0475
+[step=10503/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=2,016,576,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=10504/500000]
+ train/ActionNoiseL2Loss=0.1132
+ throughput/total_tokens=2,016,768,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10505/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=2,016,960,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10506/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=2,017,152,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10507/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=2,017,344,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10508/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=2,017,536,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10509/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=2,017,728,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10510/500000]
+ train/ActionNoiseL2Loss=0.0766
+ throughput/total_tokens=2,017,920,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10511/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=2,018,112,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10512/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=2,018,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10513/500000]
+ train/ActionNoiseL2Loss=0.0227
+ throughput/total_tokens=2,018,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10514/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=2,018,688,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10515/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=2,018,880,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10516/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=2,019,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10517/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=2,019,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10518/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=2,019,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10519/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=2,019,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10520/500000]
+ optim/total_grad_norm=0.7281
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=2,019,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10521/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=2,020,032,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10522/500000]
+ train/ActionNoiseL2Loss=0.1110
+ throughput/total_tokens=2,020,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10523/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=2,020,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10524/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=2,020,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10525/500000]
+ train/ActionNoiseL2Loss=0.1144
+ throughput/total_tokens=2,020,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10526/500000]
+ train/ActionNoiseL2Loss=0.0949
+ throughput/total_tokens=2,020,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10527/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=2,021,184,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10528/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=2,021,376,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10529/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=2,021,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10530/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=2,021,760,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10531/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=2,021,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10532/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=2,022,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10533/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=2,022,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10534/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=2,022,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10535/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=2,022,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10536/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=2,022,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10537/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=2,023,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10538/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=2,023,296,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10539/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=2,023,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10540/500000]
+ optim/total_grad_norm=1.051
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=2,023,680,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=10541/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=2,023,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10542/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=2,024,064,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10543/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=2,024,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10544/500000]
+ train/ActionNoiseL2Loss=0.0813
+ throughput/total_tokens=2,024,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10545/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=2,024,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10546/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=2,024,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10547/500000]
+ train/ActionNoiseL2Loss=0.0199
+ throughput/total_tokens=2,025,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10548/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=2,025,216,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10549/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=2,025,408,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10550/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=2,025,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10551/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=2,025,792,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10552/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,025,984,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10553/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=2,026,176,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10554/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=2,026,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10555/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=2,026,560,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10556/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=2,026,752,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10557/500000]
+ train/ActionNoiseL2Loss=0.0746
+ throughput/total_tokens=2,026,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10558/500000]
+ train/ActionNoiseL2Loss=0.0901
+ throughput/total_tokens=2,027,136,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10559/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=2,027,328,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10560/500000]
+ optim/total_grad_norm=0.8659
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=2,027,520,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10561/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=2,027,712,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10562/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=2,027,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10563/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=2,028,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10564/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=2,028,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10565/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=2,028,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10566/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=2,028,672,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10567/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=2,028,864,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10568/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=2,029,056,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10569/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=2,029,248,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10570/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=2,029,440,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10571/500000]
+ train/ActionNoiseL2Loss=0.0995
+ throughput/total_tokens=2,029,632,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10572/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=2,029,824,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10573/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=2,030,016,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10574/500000]
+ train/ActionNoiseL2Loss=0.0732
+ throughput/total_tokens=2,030,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10575/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=2,030,400,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10576/500000]
+ train/ActionNoiseL2Loss=0.0843
+ throughput/total_tokens=2,030,592,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10577/500000]
+ train/ActionNoiseL2Loss=0.1337
+ throughput/total_tokens=2,030,784,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10578/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=2,030,976,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10579/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=2,031,168,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10580/500000]
+ optim/total_grad_norm=0.6415
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=2,031,360,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=10581/500000]
+ train/ActionNoiseL2Loss=0.0902
+ throughput/total_tokens=2,031,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10582/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=2,031,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10583/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=2,031,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10584/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=2,032,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10585/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=2,032,320,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10586/500000]
+ train/ActionNoiseL2Loss=0.0780
+ throughput/total_tokens=2,032,512,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10587/500000]
+ train/ActionNoiseL2Loss=0.0791
+ throughput/total_tokens=2,032,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10588/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=2,032,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10589/500000]
+ train/ActionNoiseL2Loss=0.0999
+ throughput/total_tokens=2,033,088,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10590/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=2,033,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=10591/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=2,033,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10592/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=2,033,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10593/500000]
+ train/ActionNoiseL2Loss=0.1658
+ throughput/total_tokens=2,033,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10594/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=2,034,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10595/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=2,034,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10596/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=2,034,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10597/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=2,034,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10598/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=2,034,816,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10599/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=2,035,008,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10600/500000]
+ optim/total_grad_norm=0.6812
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=2,035,200,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=10601/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=2,035,392,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10602/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=2,035,584,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10603/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=2,035,776,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10604/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=2,035,968,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10605/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=2,036,160,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10606/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=2,036,352,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10607/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=2,036,544,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10608/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=2,036,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10609/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=2,036,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10610/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=2,037,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10611/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=2,037,312,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10612/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=2,037,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10613/500000]
+ train/ActionNoiseL2Loss=0.0991
+ throughput/total_tokens=2,037,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10614/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=2,037,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10615/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=2,038,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10616/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=2,038,272,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10617/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=2,038,464,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10618/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=2,038,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10619/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,038,848,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10620/500000]
+ optim/total_grad_norm=0.4737
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=2,039,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10621/500000]
+ train/ActionNoiseL2Loss=0.0355
+ throughput/total_tokens=2,039,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10622/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=2,039,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10623/500000]
+ train/ActionNoiseL2Loss=0.0827
+ throughput/total_tokens=2,039,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10624/500000]
+ train/ActionNoiseL2Loss=0.0893
+ throughput/total_tokens=2,039,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10625/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=2,040,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10626/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=2,040,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10627/500000]
+ train/ActionNoiseL2Loss=0.0832
+ throughput/total_tokens=2,040,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10628/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=2,040,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10629/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=2,040,768,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10630/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=2,040,960,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=10631/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=2,041,152,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10632/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=2,041,344,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10633/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=2,041,536,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10634/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=2,041,728,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10635/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,041,920,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10636/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=2,042,112,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10637/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=2,042,304,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10638/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=2,042,496,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10639/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=2,042,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10640/500000]
+ optim/total_grad_norm=0.7025
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=2,042,880,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10641/500000]
+ train/ActionNoiseL2Loss=0.0299
+ throughput/total_tokens=2,043,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10642/500000]
+ train/ActionNoiseL2Loss=0.0283
+ throughput/total_tokens=2,043,264,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10643/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=2,043,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10644/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=2,043,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10645/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=2,043,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10646/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=2,044,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10647/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=2,044,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10648/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=2,044,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10649/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=2,044,608,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10650/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=2,044,800,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10651/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=2,044,992,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10652/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=2,045,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10653/500000]
+ train/ActionNoiseL2Loss=0.0558
+ throughput/total_tokens=2,045,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10654/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=2,045,568,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10655/500000]
+ train/ActionNoiseL2Loss=0.0275
+ throughput/total_tokens=2,045,760,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10656/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=2,045,952,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10657/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=2,046,144,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10658/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=2,046,336,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10659/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=2,046,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10660/500000]
+ optim/total_grad_norm=0.3899
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=2,046,720,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10661/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=2,046,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10662/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=2,047,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10663/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=2,047,296,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10664/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=2,047,488,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10665/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=2,047,680,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10666/500000]
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=2,047,872,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10667/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=2,048,064,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10668/500000]
+ train/ActionNoiseL2Loss=0.0285
+ throughput/total_tokens=2,048,256,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10669/500000]
+ train/ActionNoiseL2Loss=0.0265
+ throughput/total_tokens=2,048,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10670/500000]
+ train/ActionNoiseL2Loss=0.0820
+ throughput/total_tokens=2,048,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10671/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=2,048,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10672/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=2,049,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10673/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=2,049,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10674/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=2,049,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10675/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=2,049,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10676/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=2,049,792,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10677/500000]
+ train/ActionNoiseL2Loss=0.0815
+ throughput/total_tokens=2,049,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10678/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=2,050,176,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10679/500000]
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=2,050,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10680/500000]
+ optim/total_grad_norm=1.082
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=2,050,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10681/500000]
+ train/ActionNoiseL2Loss=0.1055
+ throughput/total_tokens=2,050,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10682/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=2,050,944,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10683/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=2,051,136,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10684/500000]
+ train/ActionNoiseL2Loss=0.0879
+ throughput/total_tokens=2,051,328,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10685/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=2,051,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10686/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=2,051,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10687/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=2,051,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10688/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=2,052,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10689/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=2,052,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10690/500000]
+ train/ActionNoiseL2Loss=0.0632
+ throughput/total_tokens=2,052,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10691/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=2,052,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10692/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=2,052,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10693/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=2,053,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10694/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=2,053,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10695/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=2,053,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10696/500000]
+ train/ActionNoiseL2Loss=0.0616
+ throughput/total_tokens=2,053,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10697/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=2,053,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10698/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=2,054,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10699/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=2,054,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10700/500000]
+ optim/total_grad_norm=0.4017
+ train/ActionNoiseL2Loss=0.0837
+ throughput/total_tokens=2,054,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10701/500000]
+ train/ActionNoiseL2Loss=0.0405
+ throughput/total_tokens=2,054,592,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10702/500000]
+ train/ActionNoiseL2Loss=0.0781
+ throughput/total_tokens=2,054,784,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10703/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=2,054,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10704/500000]
+ train/ActionNoiseL2Loss=0.0673
+ throughput/total_tokens=2,055,168,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10705/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=2,055,360,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10706/500000]
+ train/ActionNoiseL2Loss=0.0421
+ throughput/total_tokens=2,055,552,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10707/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=2,055,744,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10708/500000]
+ train/ActionNoiseL2Loss=0.0602
+ throughput/total_tokens=2,055,936,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10709/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=2,056,128,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10710/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=2,056,320,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=10711/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=2,056,512,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10712/500000]
+ train/ActionNoiseL2Loss=0.1003
+ throughput/total_tokens=2,056,704,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10713/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=2,056,896,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10714/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=2,057,088,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10715/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=2,057,280,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10716/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=2,057,472,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10717/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=2,057,664,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10718/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=2,057,856,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=10719/500000]
+ train/ActionNoiseL2Loss=0.0864
+ throughput/total_tokens=2,058,048,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=10720/500000]
+ optim/total_grad_norm=0.6584
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=2,058,240,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10721/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=2,058,432,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10722/500000]
+ train/ActionNoiseL2Loss=0.0911
+ throughput/total_tokens=2,058,624,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10723/500000]
+ train/ActionNoiseL2Loss=0.1392
+ throughput/total_tokens=2,058,816,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10724/500000]
+ train/ActionNoiseL2Loss=0.0805
+ throughput/total_tokens=2,059,008,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10725/500000]
+ train/ActionNoiseL2Loss=0.0743
+ throughput/total_tokens=2,059,200,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10726/500000]
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=2,059,392,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10727/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,059,584,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10728/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=2,059,776,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10729/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=2,059,968,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10730/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=2,060,160,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10731/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=2,060,352,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10732/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=2,060,544,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10733/500000]
+ train/ActionNoiseL2Loss=0.0363
+ throughput/total_tokens=2,060,736,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10734/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=2,060,928,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10735/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=2,061,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10736/500000]
+ train/ActionNoiseL2Loss=0.0795
+ throughput/total_tokens=2,061,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10737/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=2,061,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10738/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=2,061,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10739/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=2,061,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10740/500000]
+ optim/total_grad_norm=0.7799
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=2,062,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10741/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=2,062,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10742/500000]
+ train/ActionNoiseL2Loss=0.0862
+ throughput/total_tokens=2,062,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10743/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=2,062,656,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10744/500000]
+ train/ActionNoiseL2Loss=0.0280
+ throughput/total_tokens=2,062,848,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10745/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=2,063,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10746/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=2,063,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10747/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=2,063,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10748/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=2,063,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10749/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=2,063,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10750/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=2,064,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10751/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=2,064,192,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10752/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=2,064,384,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10753/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=2,064,576,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10754/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=2,064,768,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10755/500000]
+ train/ActionNoiseL2Loss=0.0942
+ throughput/total_tokens=2,064,960,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=10756/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=2,065,152,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10757/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=2,065,344,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10758/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=2,065,536,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10759/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=2,065,728,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10760/500000]
+ optim/total_grad_norm=1.360
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=2,065,920,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10761/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=2,066,112,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10762/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=2,066,304,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10763/500000]
+ train/ActionNoiseL2Loss=0.0316
+ throughput/total_tokens=2,066,496,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10764/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=2,066,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10765/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=2,066,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10766/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=2,067,072,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10767/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=2,067,264,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10768/500000]
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=2,067,456,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10769/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=2,067,648,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10770/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=2,067,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10771/500000]
+ train/ActionNoiseL2Loss=0.0706
+ throughput/total_tokens=2,068,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10772/500000]
+ train/ActionNoiseL2Loss=0.0918
+ throughput/total_tokens=2,068,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10773/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=2,068,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10774/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=2,068,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10775/500000]
+ train/ActionNoiseL2Loss=0.0852
+ throughput/total_tokens=2,068,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10776/500000]
+ train/ActionNoiseL2Loss=0.0714
+ throughput/total_tokens=2,068,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10777/500000]
+ train/ActionNoiseL2Loss=0.0155
+ throughput/total_tokens=2,069,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10778/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=2,069,376,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10779/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=2,069,568,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10780/500000]
+ optim/total_grad_norm=0.5132
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,069,760,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10781/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=2,069,952,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10782/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=2,070,144,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10783/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,070,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10784/500000]
+ train/ActionNoiseL2Loss=0.0788
+ throughput/total_tokens=2,070,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10785/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=2,070,720,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10786/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=2,070,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10787/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=2,071,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10788/500000]
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=2,071,296,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10789/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=2,071,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10790/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=2,071,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10791/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=2,071,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10792/500000]
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=2,072,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10793/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=2,072,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10794/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=2,072,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10795/500000]
+ train/ActionNoiseL2Loss=0.0650
+ throughput/total_tokens=2,072,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10796/500000]
+ train/ActionNoiseL2Loss=0.0985
+ throughput/total_tokens=2,072,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10797/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,073,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10798/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=2,073,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10799/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=2,073,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10800/500000]
+ optim/total_grad_norm=0.6757
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=2,073,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10801/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=2,073,792,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10802/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=2,073,984,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10803/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=2,074,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10804/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=2,074,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10805/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=2,074,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10806/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=2,074,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10807/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=2,074,944,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10808/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,075,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10809/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=2,075,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10810/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=2,075,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10811/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=2,075,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10812/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=2,075,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10813/500000]
+ train/ActionNoiseL2Loss=0.0249
+ throughput/total_tokens=2,076,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10814/500000]
+ train/ActionNoiseL2Loss=0.0856
+ throughput/total_tokens=2,076,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10815/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=2,076,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10816/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=2,076,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10817/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=2,076,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10818/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=2,077,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10819/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=2,077,248,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10820/500000]
+ optim/total_grad_norm=0.7374
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=2,077,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10821/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=2,077,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10822/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=2,077,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10823/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=2,078,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10824/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,078,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10825/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=2,078,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10826/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=2,078,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10827/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=2,078,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10828/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=2,078,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10829/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=2,079,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10830/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=2,079,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10831/500000]
+ train/ActionNoiseL2Loss=0.0393
+ throughput/total_tokens=2,079,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10832/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=2,079,744,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10833/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=2,079,936,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10834/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=2,080,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10835/500000]
+ train/ActionNoiseL2Loss=0.0787
+ throughput/total_tokens=2,080,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10836/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=2,080,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10837/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=2,080,704,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10838/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=2,080,896,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10839/500000]
+ train/ActionNoiseL2Loss=0.0873
+ throughput/total_tokens=2,081,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10840/500000]
+ optim/total_grad_norm=0.7783
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=2,081,280,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=10841/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=2,081,472,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10842/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=2,081,664,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10843/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=2,081,856,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10844/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=2,082,048,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10845/500000]
+ train/ActionNoiseL2Loss=0.0769
+ throughput/total_tokens=2,082,240,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10846/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=2,082,432,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10847/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=2,082,624,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10848/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=2,082,816,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10849/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=2,083,008,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10850/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=2,083,200,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=10851/500000]
+ train/ActionNoiseL2Loss=0.0930
+ throughput/total_tokens=2,083,392,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=10852/500000]
+ train/ActionNoiseL2Loss=0.0811
+ throughput/total_tokens=2,083,584,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10853/500000]
+ train/ActionNoiseL2Loss=0.0713
+ throughput/total_tokens=2,083,776,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10854/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=2,083,968,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10855/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=2,084,160,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10856/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=2,084,352,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10857/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=2,084,544,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10858/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=2,084,736,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10859/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=2,084,928,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10860/500000]
+ optim/total_grad_norm=0.9259
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=2,085,120,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10861/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=2,085,312,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10862/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=2,085,504,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10863/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=2,085,696,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10864/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=2,085,888,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10865/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=2,086,080,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10866/500000]
+ train/ActionNoiseL2Loss=0.0874
+ throughput/total_tokens=2,086,272,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10867/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=2,086,464,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10868/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=2,086,656,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10869/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=2,086,848,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10870/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=2,087,040,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=10871/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=2,087,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10872/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=2,087,424,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10873/500000]
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=2,087,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10874/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=2,087,808,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10875/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=2,088,000,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10876/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=2,088,192,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10877/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=2,088,384,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10878/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=2,088,576,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10879/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,088,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10880/500000]
+ optim/total_grad_norm=0.5586
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,088,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10881/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=2,089,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10882/500000]
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=2,089,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10883/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=2,089,536,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10884/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=2,089,728,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10885/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=2,089,920,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10886/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,090,112,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10887/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=2,090,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10888/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=2,090,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10889/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=2,090,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10890/500000]
+ train/ActionNoiseL2Loss=0.0560
+ throughput/total_tokens=2,090,880,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10891/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=2,091,072,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10892/500000]
+ train/ActionNoiseL2Loss=0.0826
+ throughput/total_tokens=2,091,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10893/500000]
+ train/ActionNoiseL2Loss=0.0676
+ throughput/total_tokens=2,091,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10894/500000]
+ train/ActionNoiseL2Loss=0.0659
+ throughput/total_tokens=2,091,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10895/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=2,091,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10896/500000]
+ train/ActionNoiseL2Loss=0.0638
+ throughput/total_tokens=2,092,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10897/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=2,092,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10898/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=2,092,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10899/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=2,092,608,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10900/500000]
+ optim/total_grad_norm=0.9346
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=2,092,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10901/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=2,092,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10902/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=2,093,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10903/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=2,093,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10904/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=2,093,568,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10905/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=2,093,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10906/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=2,093,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10907/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=2,094,144,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10908/500000]
+ train/ActionNoiseL2Loss=0.0680
+ throughput/total_tokens=2,094,336,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10909/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=2,094,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10910/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=2,094,720,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=10911/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=2,094,912,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=10912/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=2,095,104,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10913/500000]
+ train/ActionNoiseL2Loss=0.0761
+ throughput/total_tokens=2,095,296,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10914/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=2,095,488,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10915/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=2,095,680,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10916/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,095,872,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10917/500000]
+ train/ActionNoiseL2Loss=0.0736
+ throughput/total_tokens=2,096,064,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10918/500000]
+ train/ActionNoiseL2Loss=0.0770
+ throughput/total_tokens=2,096,256,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10919/500000]
+ train/ActionNoiseL2Loss=0.0277
+ throughput/total_tokens=2,096,448,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=10920/500000]
+ optim/total_grad_norm=0.9540
+ train/ActionNoiseL2Loss=0.0575
+ throughput/total_tokens=2,096,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10921/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=2,096,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10922/500000]
+ train/ActionNoiseL2Loss=0.0241
+ throughput/total_tokens=2,097,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10923/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=2,097,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10924/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=2,097,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10925/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=2,097,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10926/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=2,097,792,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10927/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=2,097,984,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10928/500000]
+ train/ActionNoiseL2Loss=0.0481
+ throughput/total_tokens=2,098,176,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10929/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=2,098,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10930/500000]
+ train/ActionNoiseL2Loss=0.0629
+ throughput/total_tokens=2,098,560,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10931/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=2,098,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10932/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,098,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10933/500000]
+ train/ActionNoiseL2Loss=0.0202
+ throughput/total_tokens=2,099,136,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10934/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=2,099,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10935/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=2,099,520,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10936/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=2,099,712,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10937/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=2,099,904,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10938/500000]
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=2,100,096,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10939/500000]
+ train/ActionNoiseL2Loss=0.0803
+ throughput/total_tokens=2,100,288,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10940/500000]
+ optim/total_grad_norm=0.6888
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,100,480,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10941/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=2,100,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10942/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=2,100,864,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10943/500000]
+ train/ActionNoiseL2Loss=0.1016
+ throughput/total_tokens=2,101,056,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10944/500000]
+ train/ActionNoiseL2Loss=0.0943
+ throughput/total_tokens=2,101,248,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10945/500000]
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=2,101,440,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10946/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=2,101,632,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10947/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=2,101,824,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=10948/500000]
+ train/ActionNoiseL2Loss=0.0715
+ throughput/total_tokens=2,102,016,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10949/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=2,102,208,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=10950/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=2,102,400,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=10951/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=2,102,592,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10952/500000]
+ train/ActionNoiseL2Loss=0.0750
+ throughput/total_tokens=2,102,784,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10953/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,102,976,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10954/500000]
+ train/ActionNoiseL2Loss=0.0661
+ throughput/total_tokens=2,103,168,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10955/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=2,103,360,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10956/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=2,103,552,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10957/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=2,103,744,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10958/500000]
+ train/ActionNoiseL2Loss=0.0584
+ throughput/total_tokens=2,103,936,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10959/500000]
+ train/ActionNoiseL2Loss=0.0489
+ throughput/total_tokens=2,104,128,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10960/500000]
+ optim/total_grad_norm=1.008
+ train/ActionNoiseL2Loss=0.0936
+ throughput/total_tokens=2,104,320,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=10961/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=2,104,512,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10962/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=2,104,704,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10963/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=2,104,896,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10964/500000]
+ train/ActionNoiseL2Loss=0.0589
+ throughput/total_tokens=2,105,088,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=10965/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=2,105,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10966/500000]
+ train/ActionNoiseL2Loss=0.0332
+ throughput/total_tokens=2,105,472,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10967/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=2,105,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10968/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=2,105,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10969/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=2,106,048,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=10970/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=2,106,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10971/500000]
+ train/ActionNoiseL2Loss=0.0343
+ throughput/total_tokens=2,106,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10972/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=2,106,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10973/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=2,106,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10974/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=2,107,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10975/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=2,107,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10976/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=2,107,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10977/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=2,107,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10978/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=2,107,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10979/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=2,107,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10980/500000]
+ optim/total_grad_norm=0.9047
+ train/ActionNoiseL2Loss=0.0872
+ throughput/total_tokens=2,108,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10981/500000]
+ train/ActionNoiseL2Loss=0.0525
+ throughput/total_tokens=2,108,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10982/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=2,108,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=10983/500000]
+ train/ActionNoiseL2Loss=0.1235
+ throughput/total_tokens=2,108,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10984/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=2,108,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10985/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=2,109,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10986/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,109,312,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10987/500000]
+ train/ActionNoiseL2Loss=0.0220
+ throughput/total_tokens=2,109,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10988/500000]
+ train/ActionNoiseL2Loss=0.1254
+ throughput/total_tokens=2,109,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10989/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=2,109,888,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10990/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,110,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=10991/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=2,110,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10992/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=2,110,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10993/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=2,110,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10994/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=2,110,848,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=10995/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=2,111,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10996/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,111,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10997/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=2,111,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10998/500000]
+ train/ActionNoiseL2Loss=0.1010
+ throughput/total_tokens=2,111,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=10999/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=2,111,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11000/500000]
+ optim/total_grad_norm=0.6873
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=2,112,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+10/14 [10:09:09] INFO | >> Saving config... checkpoint.py:608
+10/14 [10:09:41] INFO | >> Saving model state... checkpoint.py:796
+10/14 [10:11:01] INFO | >> Saving optim state... checkpoint.py:811
+10/14 [10:12:32] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=11001/500000]
+ train/ActionNoiseL2Loss=0.1262
+ throughput/total_tokens=2,112,192,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11002/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,112,384,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=11003/500000]
+ train/ActionNoiseL2Loss=0.0921
+ throughput/total_tokens=2,112,576,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=11004/500000]
+ train/ActionNoiseL2Loss=0.0891
+ throughput/total_tokens=2,112,768,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=11005/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=2,112,960,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=11006/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=2,113,152,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=11007/500000]
+ train/ActionNoiseL2Loss=0.0424
+ throughput/total_tokens=2,113,344,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=11008/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,113,536,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11009/500000]
+ train/ActionNoiseL2Loss=0.0674
+ throughput/total_tokens=2,113,728,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11010/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=2,113,920,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=11011/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=2,114,112,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11012/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=2,114,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11013/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=2,114,496,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11014/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=2,114,688,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11015/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=2,114,880,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11016/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=2,115,072,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11017/500000]
+ train/ActionNoiseL2Loss=0.0802
+ throughput/total_tokens=2,115,264,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11018/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=2,115,456,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11019/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=2,115,648,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11020/500000]
+ optim/total_grad_norm=0.6809
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=2,115,840,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11021/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=2,116,032,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11022/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=2,116,224,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11023/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=2,116,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11024/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=2,116,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11025/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=2,116,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11026/500000]
+ train/ActionNoiseL2Loss=0.0364
+ throughput/total_tokens=2,116,992,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11027/500000]
+ train/ActionNoiseL2Loss=0.0323
+ throughput/total_tokens=2,117,184,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11028/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=2,117,376,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11029/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=2,117,568,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11030/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=2,117,760,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11031/500000]
+ train/ActionNoiseL2Loss=0.0245
+ throughput/total_tokens=2,117,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11032/500000]
+ train/ActionNoiseL2Loss=0.0701
+ throughput/total_tokens=2,118,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11033/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=2,118,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11034/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=2,118,528,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11035/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=2,118,720,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11036/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=2,118,912,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11037/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=2,119,104,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11038/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=2,119,296,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11039/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=2,119,488,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11040/500000]
+ optim/total_grad_norm=0.4578
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=2,119,680,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11041/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=2,119,872,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11042/500000]
+ train/ActionNoiseL2Loss=0.0599
+ throughput/total_tokens=2,120,064,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11043/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=2,120,256,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11044/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=2,120,448,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11045/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=2,120,640,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11046/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=2,120,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11047/500000]
+ train/ActionNoiseL2Loss=0.1062
+ throughput/total_tokens=2,121,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11048/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=2,121,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11049/500000]
+ train/ActionNoiseL2Loss=0.0585
+ throughput/total_tokens=2,121,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11050/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=2,121,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=11051/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=2,121,792,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11052/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=2,121,984,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11053/500000]
+ train/ActionNoiseL2Loss=0.0259
+ throughput/total_tokens=2,122,176,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11054/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=2,122,368,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11055/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=2,122,560,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11056/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=2,122,752,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11057/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=2,122,944,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11058/500000]
+ train/ActionNoiseL2Loss=0.1052
+ throughput/total_tokens=2,123,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11059/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=2,123,328,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11060/500000]
+ optim/total_grad_norm=0.5472
+ train/ActionNoiseL2Loss=0.0233
+ throughput/total_tokens=2,123,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11061/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,123,712,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11062/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=2,123,904,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11063/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=2,124,096,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11064/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=2,124,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11065/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=2,124,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11066/500000]
+ train/ActionNoiseL2Loss=0.0925
+ throughput/total_tokens=2,124,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11067/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=2,124,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11068/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=2,125,056,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11069/500000]
+ train/ActionNoiseL2Loss=0.1134
+ throughput/total_tokens=2,125,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11070/500000]
+ train/ActionNoiseL2Loss=0.1141
+ throughput/total_tokens=2,125,440,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=11071/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=2,125,632,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11072/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=2,125,824,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11073/500000]
+ train/ActionNoiseL2Loss=0.0619
+ throughput/total_tokens=2,126,016,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11074/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=2,126,208,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11075/500000]
+ train/ActionNoiseL2Loss=0.0360
+ throughput/total_tokens=2,126,400,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11076/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=2,126,592,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11077/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,126,784,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11078/500000]
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=2,126,976,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11079/500000]
+ train/ActionNoiseL2Loss=0.0292
+ throughput/total_tokens=2,127,168,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11080/500000]
+ optim/total_grad_norm=0.8678
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=2,127,360,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=11081/500000]
+ train/ActionNoiseL2Loss=0.0342
+ throughput/total_tokens=2,127,552,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11082/500000]
+ train/ActionNoiseL2Loss=0.0604
+ throughput/total_tokens=2,127,744,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11083/500000]
+ train/ActionNoiseL2Loss=0.0586
+ throughput/total_tokens=2,127,936,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11084/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=2,128,128,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11085/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=2,128,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11086/500000]
+ train/ActionNoiseL2Loss=0.0849
+ throughput/total_tokens=2,128,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11087/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=2,128,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11088/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=2,128,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11089/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=2,129,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11090/500000]
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=2,129,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11091/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=2,129,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11092/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=2,129,664,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11093/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=2,129,856,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11094/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=2,130,048,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11095/500000]
+ train/ActionNoiseL2Loss=0.0222
+ throughput/total_tokens=2,130,240,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11096/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=2,130,432,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11097/500000]
+ train/ActionNoiseL2Loss=0.0543
+ throughput/total_tokens=2,130,624,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11098/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=2,130,816,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11099/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=2,131,008,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11100/500000]
+ optim/total_grad_norm=0.6873
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=2,131,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11101/500000]
+ train/ActionNoiseL2Loss=0.1302
+ throughput/total_tokens=2,131,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11102/500000]
+ train/ActionNoiseL2Loss=0.0696
+ throughput/total_tokens=2,131,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11103/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=2,131,776,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11104/500000]
+ train/ActionNoiseL2Loss=0.0809
+ throughput/total_tokens=2,131,968,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11105/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=2,132,160,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11106/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,132,352,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11107/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=2,132,544,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11108/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=2,132,736,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=11109/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=2,132,928,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=11110/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=2,133,120,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=11111/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=2,133,312,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11112/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=2,133,504,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=11113/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=2,133,696,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=11114/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=2,133,888,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11115/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=2,134,080,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11116/500000]
+ train/ActionNoiseL2Loss=0.0923
+ throughput/total_tokens=2,134,272,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11117/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=2,134,464,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11118/500000]
+ train/ActionNoiseL2Loss=0.0740
+ throughput/total_tokens=2,134,656,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11119/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=2,134,848,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11120/500000]
+ optim/total_grad_norm=0.8090
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=2,135,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11121/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=2,135,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11122/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=2,135,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11123/500000]
+ train/ActionNoiseL2Loss=0.0435
+ throughput/total_tokens=2,135,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11124/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=2,135,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11125/500000]
+ train/ActionNoiseL2Loss=0.0218
+ throughput/total_tokens=2,136,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11126/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=2,136,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11127/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=2,136,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11128/500000]
+ train/ActionNoiseL2Loss=0.0861
+ throughput/total_tokens=2,136,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11129/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=2,136,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11130/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,136,960,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11131/500000]
+ train/ActionNoiseL2Loss=0.0816
+ throughput/total_tokens=2,137,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11132/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=2,137,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11133/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,137,536,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11134/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=2,137,728,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11135/500000]
+ train/ActionNoiseL2Loss=0.0438
+ throughput/total_tokens=2,137,920,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11136/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=2,138,112,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11137/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=2,138,304,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11138/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=2,138,496,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11139/500000]
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=2,138,688,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11140/500000]
+ optim/total_grad_norm=0.8134
+ train/ActionNoiseL2Loss=0.0990
+ throughput/total_tokens=2,138,880,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11141/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,139,072,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11142/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=2,139,264,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11143/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=2,139,456,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11144/500000]
+ train/ActionNoiseL2Loss=0.0349
+ throughput/total_tokens=2,139,648,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11145/500000]
+ train/ActionNoiseL2Loss=0.0357
+ throughput/total_tokens=2,139,840,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11146/500000]
+ train/ActionNoiseL2Loss=0.0668
+ throughput/total_tokens=2,140,032,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11147/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=2,140,224,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11148/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=2,140,416,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11149/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=2,140,608,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11150/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=2,140,800,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11151/500000]
+ train/ActionNoiseL2Loss=0.0840
+ throughput/total_tokens=2,140,992,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11152/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=2,141,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11153/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=2,141,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11154/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=2,141,568,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11155/500000]
+ train/ActionNoiseL2Loss=0.0207
+ throughput/total_tokens=2,141,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11156/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,141,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11157/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,142,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11158/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=2,142,336,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11159/500000]
+ train/ActionNoiseL2Loss=0.0912
+ throughput/total_tokens=2,142,528,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11160/500000]
+ optim/total_grad_norm=0.6086
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=2,142,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11161/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=2,142,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11162/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=2,143,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11163/500000]
+ train/ActionNoiseL2Loss=0.0188
+ throughput/total_tokens=2,143,296,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11164/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=2,143,488,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11165/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=2,143,680,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11166/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=2,143,872,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11167/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=2,144,064,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11168/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=2,144,256,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11169/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=2,144,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11170/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=2,144,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11171/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=2,144,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11172/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=2,145,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11173/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=2,145,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11174/500000]
+ train/ActionNoiseL2Loss=0.0710
+ throughput/total_tokens=2,145,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11175/500000]
+ train/ActionNoiseL2Loss=0.0461
+ throughput/total_tokens=2,145,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11176/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=2,145,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11177/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,145,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11178/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=2,146,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11179/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=2,146,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11180/500000]
+ optim/total_grad_norm=0.7078
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=2,146,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11181/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=2,146,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11182/500000]
+ train/ActionNoiseL2Loss=0.0442
+ throughput/total_tokens=2,146,944,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11183/500000]
+ train/ActionNoiseL2Loss=0.0970
+ throughput/total_tokens=2,147,136,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11184/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=2,147,328,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11185/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=2,147,520,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11186/500000]
+ train/ActionNoiseL2Loss=0.0536
+ throughput/total_tokens=2,147,712,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11187/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=2,147,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11188/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=2,148,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11189/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=2,148,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11190/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=2,148,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11191/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=2,148,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11192/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=2,148,864,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11193/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=2,149,056,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11194/500000]
+ train/ActionNoiseL2Loss=0.0932
+ throughput/total_tokens=2,149,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11195/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=2,149,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11196/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=2,149,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11197/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=2,149,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11198/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=2,150,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11199/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=2,150,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11200/500000]
+ optim/total_grad_norm=0.5690
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=2,150,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11201/500000]
+ train/ActionNoiseL2Loss=0.0244
+ throughput/total_tokens=2,150,592,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11202/500000]
+ train/ActionNoiseL2Loss=0.0550
+ throughput/total_tokens=2,150,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11203/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=2,150,976,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11204/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=2,151,168,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11205/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=2,151,360,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11206/500000]
+ train/ActionNoiseL2Loss=0.1380
+ throughput/total_tokens=2,151,552,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11207/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=2,151,744,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11208/500000]
+ train/ActionNoiseL2Loss=0.0301
+ throughput/total_tokens=2,151,936,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11209/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=2,152,128,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11210/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,152,320,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11211/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=2,152,512,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11212/500000]
+ train/ActionNoiseL2Loss=0.0193
+ throughput/total_tokens=2,152,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11213/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=2,152,896,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11214/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=2,153,088,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11215/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=2,153,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11216/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=2,153,472,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11217/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=2,153,664,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11218/500000]
+ train/ActionNoiseL2Loss=0.0926
+ throughput/total_tokens=2,153,856,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11219/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=2,154,048,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11220/500000]
+ optim/total_grad_norm=0.9380
+ train/ActionNoiseL2Loss=0.0546
+ throughput/total_tokens=2,154,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11221/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=2,154,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11222/500000]
+ train/ActionNoiseL2Loss=0.0692
+ throughput/total_tokens=2,154,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11223/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=2,154,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11224/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=2,155,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11225/500000]
+ train/ActionNoiseL2Loss=0.0789
+ throughput/total_tokens=2,155,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11226/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=2,155,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11227/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=2,155,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11228/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=2,155,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11229/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=2,155,968,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11230/500000]
+ train/ActionNoiseL2Loss=0.1080
+ throughput/total_tokens=2,156,160,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11231/500000]
+ train/ActionNoiseL2Loss=0.0223
+ throughput/total_tokens=2,156,352,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11232/500000]
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=2,156,544,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11233/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=2,156,736,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11234/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=2,156,928,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11235/500000]
+ train/ActionNoiseL2Loss=0.0314
+ throughput/total_tokens=2,157,120,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11236/500000]
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=2,157,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11237/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=2,157,504,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11238/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=2,157,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11239/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=2,157,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11240/500000]
+ optim/total_grad_norm=0.7354
+ train/ActionNoiseL2Loss=0.0682
+ throughput/total_tokens=2,158,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=11241/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=2,158,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11242/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=2,158,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11243/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=2,158,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11244/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=2,158,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11245/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=2,159,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11246/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=2,159,232,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11247/500000]
+ train/ActionNoiseL2Loss=0.0201
+ throughput/total_tokens=2,159,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11248/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=2,159,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11249/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=2,159,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11250/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=2,160,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11251/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=2,160,192,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11252/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=2,160,384,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11253/500000]
+ train/ActionNoiseL2Loss=0.0490
+ throughput/total_tokens=2,160,576,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11254/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=2,160,768,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11255/500000]
+ train/ActionNoiseL2Loss=0.0366
+ throughput/total_tokens=2,160,960,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11256/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=2,161,152,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11257/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=2,161,344,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11258/500000]
+ train/ActionNoiseL2Loss=0.1098
+ throughput/total_tokens=2,161,536,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11259/500000]
+ train/ActionNoiseL2Loss=0.0847
+ throughput/total_tokens=2,161,728,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11260/500000]
+ optim/total_grad_norm=0.5250
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,161,920,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11261/500000]
+ train/ActionNoiseL2Loss=0.0897
+ throughput/total_tokens=2,162,112,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11262/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=2,162,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11263/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=2,162,496,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11264/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=2,162,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11265/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=2,162,880,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11266/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,163,072,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11267/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=2,163,264,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11268/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=2,163,456,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11269/500000]
+ train/ActionNoiseL2Loss=0.0919
+ throughput/total_tokens=2,163,648,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11270/500000]
+ train/ActionNoiseL2Loss=0.0882
+ throughput/total_tokens=2,163,840,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11271/500000]
+ train/ActionNoiseL2Loss=0.1129
+ throughput/total_tokens=2,164,032,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11272/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=2,164,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11273/500000]
+ train/ActionNoiseL2Loss=0.0279
+ throughput/total_tokens=2,164,416,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11274/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=2,164,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11275/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=2,164,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11276/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=2,164,992,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11277/500000]
+ train/ActionNoiseL2Loss=0.0420
+ throughput/total_tokens=2,165,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11278/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=2,165,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11279/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=2,165,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11280/500000]
+ optim/total_grad_norm=0.5810
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=2,165,760,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11281/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=2,165,952,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11282/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=2,166,144,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11283/500000]
+ train/ActionNoiseL2Loss=0.0422
+ throughput/total_tokens=2,166,336,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11284/500000]
+ train/ActionNoiseL2Loss=0.0734
+ throughput/total_tokens=2,166,528,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11285/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=2,166,720,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11286/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=2,166,912,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11287/500000]
+ train/ActionNoiseL2Loss=0.0683
+ throughput/total_tokens=2,167,104,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11288/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=2,167,296,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11289/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=2,167,488,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11290/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=2,167,680,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=11291/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=2,167,872,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11292/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=2,168,064,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11293/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=2,168,256,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11294/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=2,168,448,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11295/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,168,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11296/500000]
+ train/ActionNoiseL2Loss=0.0310
+ throughput/total_tokens=2,168,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11297/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=2,169,024,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11298/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=2,169,216,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11299/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=2,169,408,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11300/500000]
+ optim/total_grad_norm=0.6158
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=2,169,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=11301/500000]
+ train/ActionNoiseL2Loss=0.0655
+ throughput/total_tokens=2,169,792,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11302/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=2,169,984,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11303/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=2,170,176,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11304/500000]
+ train/ActionNoiseL2Loss=0.0464
+ throughput/total_tokens=2,170,368,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11305/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=2,170,560,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11306/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=2,170,752,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11307/500000]
+ train/ActionNoiseL2Loss=0.0725
+ throughput/total_tokens=2,170,944,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11308/500000]
+ train/ActionNoiseL2Loss=0.0634
+ throughput/total_tokens=2,171,136,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11309/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=2,171,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11310/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=2,171,520,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11311/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=2,171,712,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11312/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=2,171,904,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11313/500000]
+ train/ActionNoiseL2Loss=0.0742
+ throughput/total_tokens=2,172,096,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11314/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=2,172,288,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11315/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=2,172,480,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11316/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=2,172,672,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11317/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=2,172,864,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11318/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=2,173,056,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11319/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=2,173,248,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11320/500000]
+ optim/total_grad_norm=0.7886
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=2,173,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11321/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=2,173,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11322/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=2,173,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11323/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=2,174,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11324/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=2,174,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11325/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=2,174,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11326/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=2,174,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11327/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=2,174,784,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11328/500000]
+ train/ActionNoiseL2Loss=0.1185
+ throughput/total_tokens=2,174,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11329/500000]
+ train/ActionNoiseL2Loss=0.0605
+ throughput/total_tokens=2,175,168,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11330/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=2,175,360,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11331/500000]
+ train/ActionNoiseL2Loss=0.0784
+ throughput/total_tokens=2,175,552,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11332/500000]
+ train/ActionNoiseL2Loss=0.0520
+ throughput/total_tokens=2,175,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11333/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=2,175,936,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11334/500000]
+ train/ActionNoiseL2Loss=0.0960
+ throughput/total_tokens=2,176,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11335/500000]
+ train/ActionNoiseL2Loss=0.0566
+ throughput/total_tokens=2,176,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11336/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=2,176,512,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11337/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=2,176,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11338/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=2,176,896,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11339/500000]
+ train/ActionNoiseL2Loss=0.0313
+ throughput/total_tokens=2,177,088,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11340/500000]
+ optim/total_grad_norm=0.7146
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=2,177,280,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11341/500000]
+ train/ActionNoiseL2Loss=0.0353
+ throughput/total_tokens=2,177,472,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11342/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=2,177,664,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11343/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=2,177,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11344/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=2,178,048,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11345/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=2,178,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11346/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=2,178,432,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11347/500000]
+ train/ActionNoiseL2Loss=0.0290
+ throughput/total_tokens=2,178,624,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11348/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=2,178,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11349/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,179,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11350/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=2,179,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11351/500000]
+ train/ActionNoiseL2Loss=0.0762
+ throughput/total_tokens=2,179,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11352/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=2,179,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11353/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=2,179,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11354/500000]
+ train/ActionNoiseL2Loss=0.0527
+ throughput/total_tokens=2,179,968,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11355/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,180,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11356/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,180,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11357/500000]
+ train/ActionNoiseL2Loss=0.0225
+ throughput/total_tokens=2,180,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11358/500000]
+ train/ActionNoiseL2Loss=0.0144
+ throughput/total_tokens=2,180,736,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11359/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=2,180,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11360/500000]
+ optim/total_grad_norm=1.240
+ train/ActionNoiseL2Loss=0.0910
+ throughput/total_tokens=2,181,120,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11361/500000]
+ train/ActionNoiseL2Loss=0.0870
+ throughput/total_tokens=2,181,312,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11362/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=2,181,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11363/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=2,181,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11364/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=2,181,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11365/500000]
+ train/ActionNoiseL2Loss=0.1056
+ throughput/total_tokens=2,182,080,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11366/500000]
+ train/ActionNoiseL2Loss=0.0522
+ throughput/total_tokens=2,182,272,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11367/500000]
+ train/ActionNoiseL2Loss=0.0633
+ throughput/total_tokens=2,182,464,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11368/500000]
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=2,182,656,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11369/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=2,182,848,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11370/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=2,183,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11371/500000]
+ train/ActionNoiseL2Loss=0.1039
+ throughput/total_tokens=2,183,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11372/500000]
+ train/ActionNoiseL2Loss=0.0523
+ throughput/total_tokens=2,183,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11373/500000]
+ train/ActionNoiseL2Loss=0.0535
+ throughput/total_tokens=2,183,616,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11374/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=2,183,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11375/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=2,184,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11376/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=2,184,192,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11377/500000]
+ train/ActionNoiseL2Loss=0.0248
+ throughput/total_tokens=2,184,384,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11378/500000]
+ train/ActionNoiseL2Loss=0.0399
+ throughput/total_tokens=2,184,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11379/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=2,184,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11380/500000]
+ optim/total_grad_norm=0.8142
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=2,184,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11381/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=2,185,152,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11382/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=2,185,344,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11383/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=2,185,536,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11384/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=2,185,728,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11385/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=2,185,920,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11386/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=2,186,112,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11387/500000]
+ train/ActionNoiseL2Loss=0.1041
+ throughput/total_tokens=2,186,304,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11388/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,186,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11389/500000]
+ train/ActionNoiseL2Loss=0.0764
+ throughput/total_tokens=2,186,688,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11390/500000]
+ train/ActionNoiseL2Loss=0.0749
+ throughput/total_tokens=2,186,880,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11391/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=2,187,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11392/500000]
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=2,187,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11393/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=2,187,456,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11394/500000]
+ train/ActionNoiseL2Loss=0.0578
+ throughput/total_tokens=2,187,648,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11395/500000]
+ train/ActionNoiseL2Loss=0.1291
+ throughput/total_tokens=2,187,840,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11396/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,188,032,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11397/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=2,188,224,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11398/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=2,188,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11399/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=2,188,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11400/500000]
+ optim/total_grad_norm=0.7353
+ train/ActionNoiseL2Loss=0.0646
+ throughput/total_tokens=2,188,800,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=11401/500000]
+ train/ActionNoiseL2Loss=0.0338
+ throughput/total_tokens=2,188,992,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11402/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=2,189,184,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11403/500000]
+ train/ActionNoiseL2Loss=0.0741
+ throughput/total_tokens=2,189,376,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11404/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=2,189,568,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11405/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=2,189,760,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11406/500000]
+ train/ActionNoiseL2Loss=0.0651
+ throughput/total_tokens=2,189,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11407/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=2,190,144,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11408/500000]
+ train/ActionNoiseL2Loss=0.0665
+ throughput/total_tokens=2,190,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11409/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=2,190,528,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11410/500000]
+ train/ActionNoiseL2Loss=0.0851
+ throughput/total_tokens=2,190,720,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11411/500000]
+ train/ActionNoiseL2Loss=0.0365
+ throughput/total_tokens=2,190,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11412/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=2,191,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11413/500000]
+ train/ActionNoiseL2Loss=0.0330
+ throughput/total_tokens=2,191,296,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11414/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=2,191,488,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11415/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=2,191,680,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11416/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=2,191,872,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11417/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=2,192,064,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11418/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=2,192,256,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11419/500000]
+ train/ActionNoiseL2Loss=0.0450
+ throughput/total_tokens=2,192,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11420/500000]
+ optim/total_grad_norm=0.6467
+ train/ActionNoiseL2Loss=0.0771
+ throughput/total_tokens=2,192,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11421/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=2,192,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11422/500000]
+ train/ActionNoiseL2Loss=0.0454
+ throughput/total_tokens=2,193,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11423/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=2,193,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11424/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=2,193,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11425/500000]
+ train/ActionNoiseL2Loss=0.0721
+ throughput/total_tokens=2,193,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11426/500000]
+ train/ActionNoiseL2Loss=0.0565
+ throughput/total_tokens=2,193,792,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11427/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=2,193,984,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11428/500000]
+ train/ActionNoiseL2Loss=0.0657
+ throughput/total_tokens=2,194,176,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11429/500000]
+ train/ActionNoiseL2Loss=0.0724
+ throughput/total_tokens=2,194,368,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11430/500000]
+ train/ActionNoiseL2Loss=0.0544
+ throughput/total_tokens=2,194,560,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=11431/500000]
+ train/ActionNoiseL2Loss=0.0513
+ throughput/total_tokens=2,194,752,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11432/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=2,194,944,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11433/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=2,195,136,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11434/500000]
+ train/ActionNoiseL2Loss=0.0511
+ throughput/total_tokens=2,195,328,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11435/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=2,195,520,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11436/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=2,195,712,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11437/500000]
+ train/ActionNoiseL2Loss=0.0467
+ throughput/total_tokens=2,195,904,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11438/500000]
+ train/ActionNoiseL2Loss=0.0848
+ throughput/total_tokens=2,196,096,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11439/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=2,196,288,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11440/500000]
+ optim/total_grad_norm=0.7707
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=2,196,480,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=11441/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=2,196,672,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11442/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=2,196,864,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11443/500000]
+ train/ActionNoiseL2Loss=0.0496
+ throughput/total_tokens=2,197,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11444/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=2,197,248,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11445/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=2,197,440,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11446/500000]
+ train/ActionNoiseL2Loss=0.0326
+ throughput/total_tokens=2,197,632,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11447/500000]
+ train/ActionNoiseL2Loss=0.0524
+ throughput/total_tokens=2,197,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11448/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=2,198,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11449/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=2,198,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11450/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=2,198,400,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11451/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=2,198,592,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11452/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=2,198,784,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11453/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=2,198,976,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11454/500000]
+ train/ActionNoiseL2Loss=0.0397
+ throughput/total_tokens=2,199,168,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11455/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=2,199,360,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11456/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=2,199,552,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11457/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=2,199,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11458/500000]
+ train/ActionNoiseL2Loss=0.0897
+ throughput/total_tokens=2,199,936,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11459/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=2,200,128,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11460/500000]
+ optim/total_grad_norm=0.6441
+ train/ActionNoiseL2Loss=0.0389
+ throughput/total_tokens=2,200,320,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11461/500000]
+ train/ActionNoiseL2Loss=0.0601
+ throughput/total_tokens=2,200,512,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11462/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=2,200,704,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11463/500000]
+ train/ActionNoiseL2Loss=0.0548
+ throughput/total_tokens=2,200,896,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11464/500000]
+ train/ActionNoiseL2Loss=0.0320
+ throughput/total_tokens=2,201,088,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11465/500000]
+ train/ActionNoiseL2Loss=0.1203
+ throughput/total_tokens=2,201,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11466/500000]
+ train/ActionNoiseL2Loss=0.0455
+ throughput/total_tokens=2,201,472,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11467/500000]
+ train/ActionNoiseL2Loss=0.0327
+ throughput/total_tokens=2,201,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11468/500000]
+ train/ActionNoiseL2Loss=0.0294
+ throughput/total_tokens=2,201,856,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11469/500000]
+ train/ActionNoiseL2Loss=0.0574
+ throughput/total_tokens=2,202,048,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11470/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=2,202,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11471/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=2,202,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11472/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=2,202,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11473/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=2,202,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11474/500000]
+ train/ActionNoiseL2Loss=0.0829
+ throughput/total_tokens=2,203,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11475/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=2,203,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11476/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=2,203,392,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11477/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=2,203,584,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11478/500000]
+ train/ActionNoiseL2Loss=0.0695
+ throughput/total_tokens=2,203,776,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11479/500000]
+ train/ActionNoiseL2Loss=0.0247
+ throughput/total_tokens=2,203,968,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11480/500000]
+ optim/total_grad_norm=0.5625
+ train/ActionNoiseL2Loss=0.0418
+ throughput/total_tokens=2,204,160,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11481/500000]
+ train/ActionNoiseL2Loss=0.0514
+ throughput/total_tokens=2,204,352,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11482/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=2,204,544,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11483/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=2,204,736,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11484/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=2,204,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11485/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=2,205,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11486/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=2,205,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11487/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=2,205,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11488/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=2,205,696,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11489/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=2,205,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11490/500000]
+ train/ActionNoiseL2Loss=0.0940
+ throughput/total_tokens=2,206,080,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11491/500000]
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=2,206,272,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11492/500000]
+ train/ActionNoiseL2Loss=0.1025
+ throughput/total_tokens=2,206,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11493/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=2,206,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11494/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=2,206,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11495/500000]
+ train/ActionNoiseL2Loss=0.0587
+ throughput/total_tokens=2,207,040,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11496/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=2,207,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11497/500000]
+ train/ActionNoiseL2Loss=0.0729
+ throughput/total_tokens=2,207,424,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11498/500000]
+ train/ActionNoiseL2Loss=0.0857
+ throughput/total_tokens=2,207,616,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11499/500000]
+ train/ActionNoiseL2Loss=0.0395
+ throughput/total_tokens=2,207,808,000
+ throughput/device/tokens_per_second=1,154
+ throughput/device/batches_per_second=0.0481
+[step=11500/500000]
+ optim/total_grad_norm=0.8561
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=2,208,000,000
+ throughput/device/tokens_per_second=1,155
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+10/14 [13:07:42] INFO | >> Saving config... checkpoint.py:608
+10/14 [13:08:19] INFO | >> Saving model state... checkpoint.py:796
+10/14 [13:09:30] INFO | >> Saving optim state... checkpoint.py:811
+10/14 [13:11:01] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=11501/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=2,208,192,000
+ throughput/device/tokens_per_second=1,131
+ throughput/device/batches_per_second=0.0472
+[step=11502/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=2,208,384,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=11503/500000]
+ train/ActionNoiseL2Loss=0.0552
+ throughput/total_tokens=2,208,576,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=11504/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=2,208,768,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0475
+[step=11505/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=2,208,960,000
+ throughput/device/tokens_per_second=1,142
+ throughput/device/batches_per_second=0.0476
+[step=11506/500000]
+ train/ActionNoiseL2Loss=0.0907
+ throughput/total_tokens=2,209,152,000
+ throughput/device/tokens_per_second=1,143
+ throughput/device/batches_per_second=0.0476
+[step=11507/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=2,209,344,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=11508/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=2,209,536,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=11509/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=2,209,728,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=11510/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=2,209,920,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=11511/500000]
+ train/ActionNoiseL2Loss=0.0281
+ throughput/total_tokens=2,210,112,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=11512/500000]
+ train/ActionNoiseL2Loss=0.0702
+ throughput/total_tokens=2,210,304,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=11513/500000]
+ train/ActionNoiseL2Loss=0.0498
+ throughput/total_tokens=2,210,496,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11514/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=2,210,688,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11515/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=2,210,880,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11516/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,211,072,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11517/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=2,211,264,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11518/500000]
+ train/ActionNoiseL2Loss=0.1048
+ throughput/total_tokens=2,211,456,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11519/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=2,211,648,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11520/500000]
+ optim/total_grad_norm=0.7132
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=2,211,840,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=11521/500000]
+ train/ActionNoiseL2Loss=0.0775
+ throughput/total_tokens=2,212,032,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11522/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=2,212,224,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11523/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=2,212,416,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11524/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=2,212,608,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11525/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=2,212,800,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11526/500000]
+ train/ActionNoiseL2Loss=0.0533
+ throughput/total_tokens=2,212,992,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11527/500000]
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=2,213,184,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11528/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=2,213,376,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11529/500000]
+ train/ActionNoiseL2Loss=0.0517
+ throughput/total_tokens=2,213,568,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11530/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=2,213,760,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11531/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=2,213,952,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11532/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=2,214,144,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11533/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=2,214,336,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11534/500000]
+ train/ActionNoiseL2Loss=0.0678
+ throughput/total_tokens=2,214,528,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11535/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=2,214,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11536/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=2,214,912,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11537/500000]
+ train/ActionNoiseL2Loss=0.0606
+ throughput/total_tokens=2,215,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11538/500000]
+ train/ActionNoiseL2Loss=0.0640
+ throughput/total_tokens=2,215,296,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11539/500000]
+ train/ActionNoiseL2Loss=0.0822
+ throughput/total_tokens=2,215,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11540/500000]
+ optim/total_grad_norm=0.5934
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=2,215,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11541/500000]
+ train/ActionNoiseL2Loss=0.0636
+ throughput/total_tokens=2,215,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11542/500000]
+ train/ActionNoiseL2Loss=0.0264
+ throughput/total_tokens=2,216,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11543/500000]
+ train/ActionNoiseL2Loss=0.0322
+ throughput/total_tokens=2,216,256,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11544/500000]
+ train/ActionNoiseL2Loss=0.0998
+ throughput/total_tokens=2,216,448,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11545/500000]
+ train/ActionNoiseL2Loss=0.0576
+ throughput/total_tokens=2,216,640,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11546/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=2,216,832,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11547/500000]
+ train/ActionNoiseL2Loss=0.0439
+ throughput/total_tokens=2,217,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11548/500000]
+ train/ActionNoiseL2Loss=0.0690
+ throughput/total_tokens=2,217,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11549/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=2,217,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11550/500000]
+ train/ActionNoiseL2Loss=0.0346
+ throughput/total_tokens=2,217,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11551/500000]
+ train/ActionNoiseL2Loss=0.0722
+ throughput/total_tokens=2,217,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11552/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=2,217,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11553/500000]
+ train/ActionNoiseL2Loss=0.0311
+ throughput/total_tokens=2,218,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11554/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=2,218,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11555/500000]
+ train/ActionNoiseL2Loss=0.0344
+ throughput/total_tokens=2,218,560,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11556/500000]
+ train/ActionNoiseL2Loss=0.0362
+ throughput/total_tokens=2,218,752,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11557/500000]
+ train/ActionNoiseL2Loss=0.0300
+ throughput/total_tokens=2,218,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11558/500000]
+ train/ActionNoiseL2Loss=0.0744
+ throughput/total_tokens=2,219,136,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11559/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=2,219,328,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11560/500000]
+ optim/total_grad_norm=0.5305
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=2,219,520,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=11561/500000]
+ train/ActionNoiseL2Loss=0.0500
+ throughput/total_tokens=2,219,712,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11562/500000]
+ train/ActionNoiseL2Loss=0.0720
+ throughput/total_tokens=2,219,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11563/500000]
+ train/ActionNoiseL2Loss=0.0869
+ throughput/total_tokens=2,220,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11564/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=2,220,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11565/500000]
+ train/ActionNoiseL2Loss=0.0711
+ throughput/total_tokens=2,220,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11566/500000]
+ train/ActionNoiseL2Loss=0.1051
+ throughput/total_tokens=2,220,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11567/500000]
+ train/ActionNoiseL2Loss=0.0859
+ throughput/total_tokens=2,220,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11568/500000]
+ train/ActionNoiseL2Loss=0.0630
+ throughput/total_tokens=2,221,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11569/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=2,221,248,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11570/500000]
+ train/ActionNoiseL2Loss=0.0374
+ throughput/total_tokens=2,221,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11571/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=2,221,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11572/500000]
+ train/ActionNoiseL2Loss=0.0663
+ throughput/total_tokens=2,221,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11573/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=2,222,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11574/500000]
+ train/ActionNoiseL2Loss=0.0401
+ throughput/total_tokens=2,222,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11575/500000]
+ train/ActionNoiseL2Loss=0.1038
+ throughput/total_tokens=2,222,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11576/500000]
+ train/ActionNoiseL2Loss=0.0436
+ throughput/total_tokens=2,222,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11577/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,222,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11578/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=2,222,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11579/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=2,223,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11580/500000]
+ optim/total_grad_norm=0.9549
+ train/ActionNoiseL2Loss=0.0325
+ throughput/total_tokens=2,223,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11581/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=2,223,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11582/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=2,223,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11583/500000]
+ train/ActionNoiseL2Loss=0.1014
+ throughput/total_tokens=2,223,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11584/500000]
+ train/ActionNoiseL2Loss=0.0540
+ throughput/total_tokens=2,224,128,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11585/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=2,224,320,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11586/500000]
+ train/ActionNoiseL2Loss=0.0592
+ throughput/total_tokens=2,224,512,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11587/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=2,224,704,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11588/500000]
+ train/ActionNoiseL2Loss=0.0383
+ throughput/total_tokens=2,224,896,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11589/500000]
+ train/ActionNoiseL2Loss=0.0266
+ throughput/total_tokens=2,225,088,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11590/500000]
+ train/ActionNoiseL2Loss=0.0986
+ throughput/total_tokens=2,225,280,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11591/500000]
+ train/ActionNoiseL2Loss=0.0387
+ throughput/total_tokens=2,225,472,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11592/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=2,225,664,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11593/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=2,225,856,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11594/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=2,226,048,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11595/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=2,226,240,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11596/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=2,226,432,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11597/500000]
+ train/ActionNoiseL2Loss=0.0251
+ throughput/total_tokens=2,226,624,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11598/500000]
+ train/ActionNoiseL2Loss=0.1383
+ throughput/total_tokens=2,226,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11599/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=2,227,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11600/500000]
+ optim/total_grad_norm=0.9464
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=2,227,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11601/500000]
+ train/ActionNoiseL2Loss=0.0579
+ throughput/total_tokens=2,227,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11602/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=2,227,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11603/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=2,227,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11604/500000]
+ train/ActionNoiseL2Loss=0.0621
+ throughput/total_tokens=2,227,968,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11605/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=2,228,160,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11606/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=2,228,352,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11607/500000]
+ train/ActionNoiseL2Loss=0.0272
+ throughput/total_tokens=2,228,544,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11608/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=2,228,736,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11609/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=2,228,928,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11610/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=2,229,120,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11611/500000]
+ train/ActionNoiseL2Loss=0.0615
+ throughput/total_tokens=2,229,312,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11612/500000]
+ train/ActionNoiseL2Loss=0.0417
+ throughput/total_tokens=2,229,504,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11613/500000]
+ train/ActionNoiseL2Loss=0.0478
+ throughput/total_tokens=2,229,696,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11614/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=2,229,888,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11615/500000]
+ train/ActionNoiseL2Loss=0.0961
+ throughput/total_tokens=2,230,080,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11616/500000]
+ train/ActionNoiseL2Loss=0.0618
+ throughput/total_tokens=2,230,272,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11617/500000]
+ train/ActionNoiseL2Loss=0.0878
+ throughput/total_tokens=2,230,464,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11618/500000]
+ train/ActionNoiseL2Loss=0.0379
+ throughput/total_tokens=2,230,656,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11619/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=2,230,848,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11620/500000]
+ optim/total_grad_norm=0.7324
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=2,231,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11621/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=2,231,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11622/500000]
+ train/ActionNoiseL2Loss=0.0351
+ throughput/total_tokens=2,231,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11623/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=2,231,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11624/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=2,231,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11625/500000]
+ train/ActionNoiseL2Loss=0.0350
+ throughput/total_tokens=2,232,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11626/500000]
+ train/ActionNoiseL2Loss=0.0507
+ throughput/total_tokens=2,232,192,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11627/500000]
+ train/ActionNoiseL2Loss=0.0556
+ throughput/total_tokens=2,232,384,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11628/500000]
+ train/ActionNoiseL2Loss=0.0594
+ throughput/total_tokens=2,232,576,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11629/500000]
+ train/ActionNoiseL2Loss=0.0555
+ throughput/total_tokens=2,232,768,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11630/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,232,960,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11631/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=2,233,152,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11632/500000]
+ train/ActionNoiseL2Loss=0.0841
+ throughput/total_tokens=2,233,344,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11633/500000]
+ train/ActionNoiseL2Loss=0.0434
+ throughput/total_tokens=2,233,536,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11634/500000]
+ train/ActionNoiseL2Loss=0.0812
+ throughput/total_tokens=2,233,728,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11635/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=2,233,920,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11636/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=2,234,112,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11637/500000]
+ train/ActionNoiseL2Loss=0.0406
+ throughput/total_tokens=2,234,304,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11638/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=2,234,496,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11639/500000]
+ train/ActionNoiseL2Loss=0.1013
+ throughput/total_tokens=2,234,688,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11640/500000]
+ optim/total_grad_norm=0.9156
+ train/ActionNoiseL2Loss=0.0793
+ throughput/total_tokens=2,234,880,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11641/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=2,235,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11642/500000]
+ train/ActionNoiseL2Loss=0.0440
+ throughput/total_tokens=2,235,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11643/500000]
+ train/ActionNoiseL2Loss=0.0917
+ throughput/total_tokens=2,235,456,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11644/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=2,235,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11645/500000]
+ train/ActionNoiseL2Loss=0.0480
+ throughput/total_tokens=2,235,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11646/500000]
+ train/ActionNoiseL2Loss=0.0268
+ throughput/total_tokens=2,236,032,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11647/500000]
+ train/ActionNoiseL2Loss=0.0271
+ throughput/total_tokens=2,236,224,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11648/500000]
+ train/ActionNoiseL2Loss=0.0699
+ throughput/total_tokens=2,236,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11649/500000]
+ train/ActionNoiseL2Loss=0.1236
+ throughput/total_tokens=2,236,608,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11650/500000]
+ train/ActionNoiseL2Loss=0.0466
+ throughput/total_tokens=2,236,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11651/500000]
+ train/ActionNoiseL2Loss=0.0518
+ throughput/total_tokens=2,236,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11652/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=2,237,184,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11653/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=2,237,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11654/500000]
+ train/ActionNoiseL2Loss=0.0411
+ throughput/total_tokens=2,237,568,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11655/500000]
+ train/ActionNoiseL2Loss=0.0581
+ throughput/total_tokens=2,237,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11656/500000]
+ train/ActionNoiseL2Loss=0.0459
+ throughput/total_tokens=2,237,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11657/500000]
+ train/ActionNoiseL2Loss=0.1102
+ throughput/total_tokens=2,238,144,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11658/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=2,238,336,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11659/500000]
+ train/ActionNoiseL2Loss=0.0254
+ throughput/total_tokens=2,238,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11660/500000]
+ optim/total_grad_norm=1.159
+ train/ActionNoiseL2Loss=0.0978
+ throughput/total_tokens=2,238,720,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11661/500000]
+ train/ActionNoiseL2Loss=0.0938
+ throughput/total_tokens=2,238,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11662/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=2,239,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11663/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=2,239,296,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11664/500000]
+ train/ActionNoiseL2Loss=0.0839
+ throughput/total_tokens=2,239,488,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11665/500000]
+ train/ActionNoiseL2Loss=0.0506
+ throughput/total_tokens=2,239,680,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11666/500000]
+ train/ActionNoiseL2Loss=0.0712
+ throughput/total_tokens=2,239,872,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11667/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=2,240,064,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11668/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=2,240,256,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11669/500000]
+ train/ActionNoiseL2Loss=0.0561
+ throughput/total_tokens=2,240,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11670/500000]
+ train/ActionNoiseL2Loss=0.0888
+ throughput/total_tokens=2,240,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11671/500000]
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=2,240,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11672/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=2,241,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11673/500000]
+ train/ActionNoiseL2Loss=0.0352
+ throughput/total_tokens=2,241,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11674/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,241,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11675/500000]
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=2,241,600,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11676/500000]
+ train/ActionNoiseL2Loss=0.0239
+ throughput/total_tokens=2,241,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11677/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=2,241,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11678/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=2,242,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11679/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=2,242,368,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11680/500000]
+ optim/total_grad_norm=0.6256
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=2,242,560,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11681/500000]
+ train/ActionNoiseL2Loss=0.0647
+ throughput/total_tokens=2,242,752,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11682/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=2,242,944,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11683/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=2,243,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11684/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=2,243,328,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11685/500000]
+ train/ActionNoiseL2Loss=0.0767
+ throughput/total_tokens=2,243,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11686/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=2,243,712,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11687/500000]
+ train/ActionNoiseL2Loss=0.0613
+ throughput/total_tokens=2,243,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11688/500000]
+ train/ActionNoiseL2Loss=0.0453
+ throughput/total_tokens=2,244,096,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11689/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=2,244,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11690/500000]
+ train/ActionNoiseL2Loss=0.0704
+ throughput/total_tokens=2,244,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11691/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=2,244,672,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11692/500000]
+ train/ActionNoiseL2Loss=0.0321
+ throughput/total_tokens=2,244,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11693/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=2,245,056,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11694/500000]
+ train/ActionNoiseL2Loss=0.0853
+ throughput/total_tokens=2,245,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11695/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=2,245,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11696/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=2,245,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11697/500000]
+ train/ActionNoiseL2Loss=0.0376
+ throughput/total_tokens=2,245,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11698/500000]
+ train/ActionNoiseL2Loss=0.0627
+ throughput/total_tokens=2,246,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11699/500000]
+ train/ActionNoiseL2Loss=0.0382
+ throughput/total_tokens=2,246,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11700/500000]
+ optim/total_grad_norm=0.8363
+ train/ActionNoiseL2Loss=0.1058
+ throughput/total_tokens=2,246,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11701/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=2,246,592,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11702/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=2,246,784,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11703/500000]
+ train/ActionNoiseL2Loss=0.0303
+ throughput/total_tokens=2,246,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11704/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=2,247,168,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11705/500000]
+ train/ActionNoiseL2Loss=0.0335
+ throughput/total_tokens=2,247,360,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11706/500000]
+ train/ActionNoiseL2Loss=0.0818
+ throughput/total_tokens=2,247,552,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11707/500000]
+ train/ActionNoiseL2Loss=0.0250
+ throughput/total_tokens=2,247,744,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11708/500000]
+ train/ActionNoiseL2Loss=0.0573
+ throughput/total_tokens=2,247,936,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11709/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=2,248,128,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11710/500000]
+ train/ActionNoiseL2Loss=0.1175
+ throughput/total_tokens=2,248,320,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11711/500000]
+ train/ActionNoiseL2Loss=0.0483
+ throughput/total_tokens=2,248,512,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11712/500000]
+ train/ActionNoiseL2Loss=0.0880
+ throughput/total_tokens=2,248,704,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11713/500000]
+ train/ActionNoiseL2Loss=0.0278
+ throughput/total_tokens=2,248,896,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11714/500000]
+ train/ActionNoiseL2Loss=0.0929
+ throughput/total_tokens=2,249,088,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11715/500000]
+ train/ActionNoiseL2Loss=0.0385
+ throughput/total_tokens=2,249,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11716/500000]
+ train/ActionNoiseL2Loss=0.0134
+ throughput/total_tokens=2,249,472,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11717/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,249,664,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11718/500000]
+ train/ActionNoiseL2Loss=0.0580
+ throughput/total_tokens=2,249,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11719/500000]
+ train/ActionNoiseL2Loss=0.0470
+ throughput/total_tokens=2,250,048,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11720/500000]
+ optim/total_grad_norm=0.5982
+ train/ActionNoiseL2Loss=0.0745
+ throughput/total_tokens=2,250,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11721/500000]
+ train/ActionNoiseL2Loss=0.0475
+ throughput/total_tokens=2,250,432,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11722/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=2,250,624,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11723/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=2,250,816,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11724/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=2,251,008,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11725/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=2,251,200,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11726/500000]
+ train/ActionNoiseL2Loss=0.0821
+ throughput/total_tokens=2,251,392,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11727/500000]
+ train/ActionNoiseL2Loss=0.0484
+ throughput/total_tokens=2,251,584,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11728/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=2,251,776,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11729/500000]
+ train/ActionNoiseL2Loss=0.0739
+ throughput/total_tokens=2,251,968,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11730/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=2,252,160,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11731/500000]
+ train/ActionNoiseL2Loss=0.0625
+ throughput/total_tokens=2,252,352,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11732/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=2,252,544,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11733/500000]
+ train/ActionNoiseL2Loss=0.0412
+ throughput/total_tokens=2,252,736,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11734/500000]
+ train/ActionNoiseL2Loss=0.1060
+ throughput/total_tokens=2,252,928,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11735/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=2,253,120,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11736/500000]
+ train/ActionNoiseL2Loss=0.0549
+ throughput/total_tokens=2,253,312,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11737/500000]
+ train/ActionNoiseL2Loss=0.0380
+ throughput/total_tokens=2,253,504,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11738/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=2,253,696,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11739/500000]
+ train/ActionNoiseL2Loss=0.0603
+ throughput/total_tokens=2,253,888,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11740/500000]
+ optim/total_grad_norm=0.7577
+ train/ActionNoiseL2Loss=0.0396
+ throughput/total_tokens=2,254,080,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11741/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=2,254,272,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11742/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=2,254,464,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11743/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=2,254,656,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11744/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=2,254,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11745/500000]
+ train/ActionNoiseL2Loss=0.0752
+ throughput/total_tokens=2,255,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11746/500000]
+ train/ActionNoiseL2Loss=0.0486
+ throughput/total_tokens=2,255,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11747/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=2,255,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11748/500000]
+ train/ActionNoiseL2Loss=0.0675
+ throughput/total_tokens=2,255,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11749/500000]
+ train/ActionNoiseL2Loss=0.0801
+ throughput/total_tokens=2,255,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11750/500000]
+ train/ActionNoiseL2Loss=0.0465
+ throughput/total_tokens=2,256,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11751/500000]
+ train/ActionNoiseL2Loss=0.0324
+ throughput/total_tokens=2,256,192,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11752/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=2,256,384,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11753/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=2,256,576,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11754/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=2,256,768,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11755/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=2,256,960,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11756/500000]
+ train/ActionNoiseL2Loss=0.0491
+ throughput/total_tokens=2,257,152,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11757/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=2,257,344,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11758/500000]
+ train/ActionNoiseL2Loss=0.0635
+ throughput/total_tokens=2,257,536,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11759/500000]
+ train/ActionNoiseL2Loss=0.0336
+ throughput/total_tokens=2,257,728,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11760/500000]
+ optim/total_grad_norm=0.5202
+ train/ActionNoiseL2Loss=0.0554
+ throughput/total_tokens=2,257,920,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=11761/500000]
+ train/ActionNoiseL2Loss=0.0974
+ throughput/total_tokens=2,258,112,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11762/500000]
+ train/ActionNoiseL2Loss=0.0381
+ throughput/total_tokens=2,258,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11763/500000]
+ train/ActionNoiseL2Loss=0.0378
+ throughput/total_tokens=2,258,496,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11764/500000]
+ train/ActionNoiseL2Loss=0.0617
+ throughput/total_tokens=2,258,688,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11765/500000]
+ train/ActionNoiseL2Loss=0.0240
+ throughput/total_tokens=2,258,880,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11766/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=2,259,072,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11767/500000]
+ train/ActionNoiseL2Loss=0.0377
+ throughput/total_tokens=2,259,264,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11768/500000]
+ train/ActionNoiseL2Loss=0.0515
+ throughput/total_tokens=2,259,456,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=11769/500000]
+ train/ActionNoiseL2Loss=0.0709
+ throughput/total_tokens=2,259,648,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=11770/500000]
+ train/ActionNoiseL2Loss=0.0371
+ throughput/total_tokens=2,259,840,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11771/500000]
+ train/ActionNoiseL2Loss=0.0865
+ throughput/total_tokens=2,260,032,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11772/500000]
+ train/ActionNoiseL2Loss=0.0538
+ throughput/total_tokens=2,260,224,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11773/500000]
+ train/ActionNoiseL2Loss=0.0505
+ throughput/total_tokens=2,260,416,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11774/500000]
+ train/ActionNoiseL2Loss=0.0296
+ throughput/total_tokens=2,260,608,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11775/500000]
+ train/ActionNoiseL2Loss=0.0354
+ throughput/total_tokens=2,260,800,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11776/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=2,260,992,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11777/500000]
+ train/ActionNoiseL2Loss=0.1028
+ throughput/total_tokens=2,261,184,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11778/500000]
+ train/ActionNoiseL2Loss=0.0529
+ throughput/total_tokens=2,261,376,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11779/500000]
+ train/ActionNoiseL2Loss=0.0492
+ throughput/total_tokens=2,261,568,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11780/500000]
+ optim/total_grad_norm=0.7575
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=2,261,760,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11781/500000]
+ train/ActionNoiseL2Loss=0.0689
+ throughput/total_tokens=2,261,952,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11782/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=2,262,144,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11783/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=2,262,336,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11784/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=2,262,528,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11785/500000]
+ train/ActionNoiseL2Loss=0.1007
+ throughput/total_tokens=2,262,720,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11786/500000]
+ train/ActionNoiseL2Loss=0.0639
+ throughput/total_tokens=2,262,912,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11787/500000]
+ train/ActionNoiseL2Loss=0.0898
+ throughput/total_tokens=2,263,104,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11788/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=2,263,296,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11789/500000]
+ train/ActionNoiseL2Loss=0.0628
+ throughput/total_tokens=2,263,488,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11790/500000]
+ train/ActionNoiseL2Loss=0.1085
+ throughput/total_tokens=2,263,680,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11791/500000]
+ train/ActionNoiseL2Loss=0.0643
+ throughput/total_tokens=2,263,872,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11792/500000]
+ train/ActionNoiseL2Loss=0.0648
+ throughput/total_tokens=2,264,064,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11793/500000]
+ train/ActionNoiseL2Loss=0.0637
+ throughput/total_tokens=2,264,256,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11794/500000]
+ train/ActionNoiseL2Loss=0.0392
+ throughput/total_tokens=2,264,448,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11795/500000]
+ train/ActionNoiseL2Loss=0.0945
+ throughput/total_tokens=2,264,640,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11796/500000]
+ train/ActionNoiseL2Loss=0.0667
+ throughput/total_tokens=2,264,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11797/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=2,265,024,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11798/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=2,265,216,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11799/500000]
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=2,265,408,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11800/500000]
+ optim/total_grad_norm=1.016
+ train/ActionNoiseL2Loss=0.0445
+ throughput/total_tokens=2,265,600,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11801/500000]
+ train/ActionNoiseL2Loss=0.0410
+ throughput/total_tokens=2,265,792,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11802/500000]
+ train/ActionNoiseL2Loss=0.0521
+ throughput/total_tokens=2,265,984,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11803/500000]
+ train/ActionNoiseL2Loss=0.0582
+ throughput/total_tokens=2,266,176,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11804/500000]
+ train/ActionNoiseL2Loss=0.0495
+ throughput/total_tokens=2,266,368,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11805/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=2,266,560,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11806/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=2,266,752,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11807/500000]
+ train/ActionNoiseL2Loss=0.0304
+ throughput/total_tokens=2,266,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11808/500000]
+ train/ActionNoiseL2Loss=0.0547
+ throughput/total_tokens=2,267,136,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11809/500000]
+ train/ActionNoiseL2Loss=0.0686
+ throughput/total_tokens=2,267,328,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11810/500000]
+ train/ActionNoiseL2Loss=0.0551
+ throughput/total_tokens=2,267,520,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11811/500000]
+ train/ActionNoiseL2Loss=0.0719
+ throughput/total_tokens=2,267,712,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11812/500000]
+ train/ActionNoiseL2Loss=0.0427
+ throughput/total_tokens=2,267,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11813/500000]
+ train/ActionNoiseL2Loss=0.1140
+ throughput/total_tokens=2,268,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11814/500000]
+ train/ActionNoiseL2Loss=0.0416
+ throughput/total_tokens=2,268,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11815/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=2,268,480,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11816/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=2,268,672,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11817/500000]
+ train/ActionNoiseL2Loss=0.0894
+ throughput/total_tokens=2,268,864,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11818/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=2,269,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11819/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=2,269,248,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11820/500000]
+ optim/total_grad_norm=0.6242
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=2,269,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11821/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=2,269,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11822/500000]
+ train/ActionNoiseL2Loss=0.0358
+ throughput/total_tokens=2,269,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11823/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=2,270,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11824/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=2,270,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11825/500000]
+ train/ActionNoiseL2Loss=0.0469
+ throughput/total_tokens=2,270,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11826/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=2,270,592,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11827/500000]
+ train/ActionNoiseL2Loss=0.0479
+ throughput/total_tokens=2,270,784,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11828/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=2,270,976,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11829/500000]
+ train/ActionNoiseL2Loss=0.0509
+ throughput/total_tokens=2,271,168,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11830/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,271,360,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11831/500000]
+ train/ActionNoiseL2Loss=0.0368
+ throughput/total_tokens=2,271,552,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11832/500000]
+ train/ActionNoiseL2Loss=0.0753
+ throughput/total_tokens=2,271,744,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11833/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=2,271,936,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11834/500000]
+ train/ActionNoiseL2Loss=0.0571
+ throughput/total_tokens=2,272,128,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11835/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=2,272,320,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11836/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=2,272,512,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11837/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=2,272,704,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11838/500000]
+ train/ActionNoiseL2Loss=0.0407
+ throughput/total_tokens=2,272,896,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11839/500000]
+ train/ActionNoiseL2Loss=0.0595
+ throughput/total_tokens=2,273,088,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11840/500000]
+ optim/total_grad_norm=0.8923
+ train/ActionNoiseL2Loss=0.0785
+ throughput/total_tokens=2,273,280,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11841/500000]
+ train/ActionNoiseL2Loss=0.0763
+ throughput/total_tokens=2,273,472,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11842/500000]
+ train/ActionNoiseL2Loss=0.0284
+ throughput/total_tokens=2,273,664,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11843/500000]
+ train/ActionNoiseL2Loss=0.0476
+ throughput/total_tokens=2,273,856,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11844/500000]
+ train/ActionNoiseL2Loss=0.0645
+ throughput/total_tokens=2,274,048,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11845/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=2,274,240,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11846/500000]
+ train/ActionNoiseL2Loss=0.1173
+ throughput/total_tokens=2,274,432,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11847/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=2,274,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11848/500000]
+ train/ActionNoiseL2Loss=0.0537
+ throughput/total_tokens=2,274,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11849/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=2,275,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11850/500000]
+ train/ActionNoiseL2Loss=0.0611
+ throughput/total_tokens=2,275,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11851/500000]
+ train/ActionNoiseL2Loss=0.0390
+ throughput/total_tokens=2,275,392,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11852/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=2,275,584,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11853/500000]
+ train/ActionNoiseL2Loss=0.0312
+ throughput/total_tokens=2,275,776,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11854/500000]
+ train/ActionNoiseL2Loss=0.0372
+ throughput/total_tokens=2,275,968,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11855/500000]
+ train/ActionNoiseL2Loss=0.0347
+ throughput/total_tokens=2,276,160,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11856/500000]
+ train/ActionNoiseL2Loss=0.0723
+ throughput/total_tokens=2,276,352,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11857/500000]
+ train/ActionNoiseL2Loss=0.0669
+ throughput/total_tokens=2,276,544,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11858/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,276,736,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11859/500000]
+ train/ActionNoiseL2Loss=0.0400
+ throughput/total_tokens=2,276,928,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=11860/500000]
+ optim/total_grad_norm=0.7685
+ train/ActionNoiseL2Loss=0.0398
+ throughput/total_tokens=2,277,120,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=11861/500000]
+ train/ActionNoiseL2Loss=0.0446
+ throughput/total_tokens=2,277,312,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=11862/500000]
+ train/ActionNoiseL2Loss=0.1046
+ throughput/total_tokens=2,277,504,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11863/500000]
+ train/ActionNoiseL2Loss=0.0759
+ throughput/total_tokens=2,277,696,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11864/500000]
+ train/ActionNoiseL2Loss=0.1363
+ throughput/total_tokens=2,277,888,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11865/500000]
+ train/ActionNoiseL2Loss=0.0730
+ throughput/total_tokens=2,278,080,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11866/500000]
+ train/ActionNoiseL2Loss=0.0620
+ throughput/total_tokens=2,278,272,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11867/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=2,278,464,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11868/500000]
+ train/ActionNoiseL2Loss=0.0737
+ throughput/total_tokens=2,278,656,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11869/500000]
+ train/ActionNoiseL2Loss=0.0391
+ throughput/total_tokens=2,278,848,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=11870/500000]
+ train/ActionNoiseL2Loss=0.0774
+ throughput/total_tokens=2,279,040,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11871/500000]
+ train/ActionNoiseL2Loss=0.0305
+ throughput/total_tokens=2,279,232,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11872/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=2,279,424,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11873/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=2,279,616,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11874/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=2,279,808,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11875/500000]
+ train/ActionNoiseL2Loss=0.0896
+ throughput/total_tokens=2,280,000,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11876/500000]
+ train/ActionNoiseL2Loss=0.0494
+ throughput/total_tokens=2,280,192,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11877/500000]
+ train/ActionNoiseL2Loss=0.0662
+ throughput/total_tokens=2,280,384,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11878/500000]
+ train/ActionNoiseL2Loss=0.0786
+ throughput/total_tokens=2,280,576,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11879/500000]
+ train/ActionNoiseL2Loss=0.0356
+ throughput/total_tokens=2,280,768,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11880/500000]
+ optim/total_grad_norm=0.5680
+ train/ActionNoiseL2Loss=0.0516
+ throughput/total_tokens=2,280,960,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11881/500000]
+ train/ActionNoiseL2Loss=0.0361
+ throughput/total_tokens=2,281,152,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11882/500000]
+ train/ActionNoiseL2Loss=0.0408
+ throughput/total_tokens=2,281,344,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11883/500000]
+ train/ActionNoiseL2Loss=0.0569
+ throughput/total_tokens=2,281,536,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11884/500000]
+ train/ActionNoiseL2Loss=0.0782
+ throughput/total_tokens=2,281,728,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11885/500000]
+ train/ActionNoiseL2Loss=0.0394
+ throughput/total_tokens=2,281,920,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11886/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=2,282,112,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11887/500000]
+ train/ActionNoiseL2Loss=0.0317
+ throughput/total_tokens=2,282,304,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11888/500000]
+ train/ActionNoiseL2Loss=0.0493
+ throughput/total_tokens=2,282,496,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11889/500000]
+ train/ActionNoiseL2Loss=0.0751
+ throughput/total_tokens=2,282,688,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11890/500000]
+ train/ActionNoiseL2Loss=0.0836
+ throughput/total_tokens=2,282,880,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11891/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=2,283,072,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11892/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=2,283,264,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11893/500000]
+ train/ActionNoiseL2Loss=0.1183
+ throughput/total_tokens=2,283,456,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11894/500000]
+ train/ActionNoiseL2Loss=0.0431
+ throughput/total_tokens=2,283,648,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11895/500000]
+ train/ActionNoiseL2Loss=0.0755
+ throughput/total_tokens=2,283,840,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11896/500000]
+ train/ActionNoiseL2Loss=0.0111
+ throughput/total_tokens=2,284,032,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11897/500000]
+ train/ActionNoiseL2Loss=0.0831
+ throughput/total_tokens=2,284,224,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0480
+[step=11898/500000]
+ train/ActionNoiseL2Loss=0.0726
+ throughput/total_tokens=2,284,416,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11899/500000]
+ train/ActionNoiseL2Loss=0.0384
+ throughput/total_tokens=2,284,608,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11900/500000]
+ optim/total_grad_norm=0.5991
+ train/ActionNoiseL2Loss=0.0687
+ throughput/total_tokens=2,284,800,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11901/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=2,284,992,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11902/500000]
+ train/ActionNoiseL2Loss=0.0539
+ throughput/total_tokens=2,285,184,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11903/500000]
+ train/ActionNoiseL2Loss=0.0432
+ throughput/total_tokens=2,285,376,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11904/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=2,285,568,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11905/500000]
+ train/ActionNoiseL2Loss=0.0262
+ throughput/total_tokens=2,285,760,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11906/500000]
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=2,285,952,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11907/500000]
+ train/ActionNoiseL2Loss=0.0531
+ throughput/total_tokens=2,286,144,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11908/500000]
+ train/ActionNoiseL2Loss=0.0941
+ throughput/total_tokens=2,286,336,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11909/500000]
+ train/ActionNoiseL2Loss=0.0790
+ throughput/total_tokens=2,286,528,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11910/500000]
+ train/ActionNoiseL2Loss=0.0666
+ throughput/total_tokens=2,286,720,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11911/500000]
+ train/ActionNoiseL2Loss=0.0653
+ throughput/total_tokens=2,286,912,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11912/500000]
+ train/ActionNoiseL2Loss=0.0477
+ throughput/total_tokens=2,287,104,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11913/500000]
+ train/ActionNoiseL2Loss=0.0610
+ throughput/total_tokens=2,287,296,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11914/500000]
+ train/ActionNoiseL2Loss=0.0778
+ throughput/total_tokens=2,287,488,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11915/500000]
+ train/ActionNoiseL2Loss=0.0738
+ throughput/total_tokens=2,287,680,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=11916/500000]
+ train/ActionNoiseL2Loss=0.0468
+ throughput/total_tokens=2,287,872,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11917/500000]
+ train/ActionNoiseL2Loss=0.0287
+ throughput/total_tokens=2,288,064,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11918/500000]
+ train/ActionNoiseL2Loss=0.0462
+ throughput/total_tokens=2,288,256,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11919/500000]
+ train/ActionNoiseL2Loss=0.0608
+ throughput/total_tokens=2,288,448,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11920/500000]
+ optim/total_grad_norm=0.4379
+ train/ActionNoiseL2Loss=0.0487
+ throughput/total_tokens=2,288,640,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11921/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=2,288,832,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11922/500000]
+ train/ActionNoiseL2Loss=0.0501
+ throughput/total_tokens=2,289,024,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11923/500000]
+ train/ActionNoiseL2Loss=0.0765
+ throughput/total_tokens=2,289,216,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11924/500000]
+ train/ActionNoiseL2Loss=0.0319
+ throughput/total_tokens=2,289,408,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11925/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=2,289,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11926/500000]
+ train/ActionNoiseL2Loss=0.0846
+ throughput/total_tokens=2,289,792,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11927/500000]
+ train/ActionNoiseL2Loss=0.0545
+ throughput/total_tokens=2,289,984,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11928/500000]
+ train/ActionNoiseL2Loss=0.0631
+ throughput/total_tokens=2,290,176,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11929/500000]
+ train/ActionNoiseL2Loss=0.0452
+ throughput/total_tokens=2,290,368,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11930/500000]
+ train/ActionNoiseL2Loss=0.0210
+ throughput/total_tokens=2,290,560,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11931/500000]
+ train/ActionNoiseL2Loss=0.0756
+ throughput/total_tokens=2,290,752,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11932/500000]
+ train/ActionNoiseL2Loss=0.0593
+ throughput/total_tokens=2,290,944,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11933/500000]
+ train/ActionNoiseL2Loss=0.0429
+ throughput/total_tokens=2,291,136,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11934/500000]
+ train/ActionNoiseL2Loss=0.0824
+ throughput/total_tokens=2,291,328,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11935/500000]
+ train/ActionNoiseL2Loss=0.0209
+ throughput/total_tokens=2,291,520,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11936/500000]
+ train/ActionNoiseL2Loss=0.0510
+ throughput/total_tokens=2,291,712,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11937/500000]
+ train/ActionNoiseL2Loss=0.0359
+ throughput/total_tokens=2,291,904,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11938/500000]
+ train/ActionNoiseL2Loss=0.0309
+ throughput/total_tokens=2,292,096,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11939/500000]
+ train/ActionNoiseL2Loss=0.0660
+ throughput/total_tokens=2,292,288,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11940/500000]
+ optim/total_grad_norm=0.6027
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=2,292,480,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11941/500000]
+ train/ActionNoiseL2Loss=0.0716
+ throughput/total_tokens=2,292,672,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11942/500000]
+ train/ActionNoiseL2Loss=0.0441
+ throughput/total_tokens=2,292,864,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11943/500000]
+ train/ActionNoiseL2Loss=0.1082
+ throughput/total_tokens=2,293,056,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11944/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=2,293,248,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11945/500000]
+ train/ActionNoiseL2Loss=0.0703
+ throughput/total_tokens=2,293,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11946/500000]
+ train/ActionNoiseL2Loss=0.0783
+ throughput/total_tokens=2,293,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11947/500000]
+ train/ActionNoiseL2Loss=0.0557
+ throughput/total_tokens=2,293,824,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11948/500000]
+ train/ActionNoiseL2Loss=0.0572
+ throughput/total_tokens=2,294,016,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11949/500000]
+ train/ActionNoiseL2Loss=0.0402
+ throughput/total_tokens=2,294,208,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=11950/500000]
+ train/ActionNoiseL2Loss=0.0677
+ throughput/total_tokens=2,294,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11951/500000]
+ train/ActionNoiseL2Loss=0.0373
+ throughput/total_tokens=2,294,592,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11952/500000]
+ train/ActionNoiseL2Loss=0.0460
+ throughput/total_tokens=2,294,784,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11953/500000]
+ train/ActionNoiseL2Loss=0.0437
+ throughput/total_tokens=2,294,976,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11954/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=2,295,168,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=11955/500000]
+ train/ActionNoiseL2Loss=0.0950
+ throughput/total_tokens=2,295,360,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11956/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=2,295,552,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11957/500000]
+ train/ActionNoiseL2Loss=0.0497
+ throughput/total_tokens=2,295,744,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11958/500000]
+ train/ActionNoiseL2Loss=0.0217
+ throughput/total_tokens=2,295,936,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11959/500000]
+ train/ActionNoiseL2Loss=0.0623
+ throughput/total_tokens=2,296,128,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11960/500000]
+ optim/total_grad_norm=0.6215
+ train/ActionNoiseL2Loss=0.0415
+ throughput/total_tokens=2,296,320,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=11961/500000]
+ train/ActionNoiseL2Loss=0.0474
+ throughput/total_tokens=2,296,512,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11962/500000]
+ train/ActionNoiseL2Loss=0.0345
+ throughput/total_tokens=2,296,704,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11963/500000]
+ train/ActionNoiseL2Loss=0.0423
+ throughput/total_tokens=2,296,896,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11964/500000]
+ train/ActionNoiseL2Loss=0.0428
+ throughput/total_tokens=2,297,088,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11965/500000]
+ train/ActionNoiseL2Loss=0.0612
+ throughput/total_tokens=2,297,280,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11966/500000]
+ train/ActionNoiseL2Loss=0.0570
+ throughput/total_tokens=2,297,472,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11967/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=2,297,664,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11968/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=2,297,856,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=11969/500000]
+ train/ActionNoiseL2Loss=0.0291
+ throughput/total_tokens=2,298,048,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=11970/500000]
+ train/ActionNoiseL2Loss=0.0754
+ throughput/total_tokens=2,298,240,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11971/500000]
+ train/ActionNoiseL2Loss=0.0463
+ throughput/total_tokens=2,298,432,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11972/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=2,298,624,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11973/500000]
+ train/ActionNoiseL2Loss=0.0748
+ throughput/total_tokens=2,298,816,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11974/500000]
+ train/ActionNoiseL2Loss=0.0375
+ throughput/total_tokens=2,299,008,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11975/500000]
+ train/ActionNoiseL2Loss=0.0708
+ throughput/total_tokens=2,299,200,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11976/500000]
+ train/ActionNoiseL2Loss=0.0622
+ throughput/total_tokens=2,299,392,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11977/500000]
+ train/ActionNoiseL2Loss=0.0270
+ throughput/total_tokens=2,299,584,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11978/500000]
+ train/ActionNoiseL2Loss=0.0503
+ throughput/total_tokens=2,299,776,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11979/500000]
+ train/ActionNoiseL2Loss=0.1008
+ throughput/total_tokens=2,299,968,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11980/500000]
+ optim/total_grad_norm=0.6785
+ train/ActionNoiseL2Loss=0.0534
+ throughput/total_tokens=2,300,160,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11981/500000]
+ train/ActionNoiseL2Loss=0.0828
+ throughput/total_tokens=2,300,352,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11982/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=2,300,544,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11983/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=2,300,736,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11984/500000]
+ train/ActionNoiseL2Loss=0.0530
+ throughput/total_tokens=2,300,928,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11985/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=2,301,120,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11986/500000]
+ train/ActionNoiseL2Loss=0.0671
+ throughput/total_tokens=2,301,312,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11987/500000]
+ train/ActionNoiseL2Loss=0.0404
+ throughput/total_tokens=2,301,504,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11988/500000]
+ train/ActionNoiseL2Loss=0.0681
+ throughput/total_tokens=2,301,696,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11989/500000]
+ train/ActionNoiseL2Loss=0.0858
+ throughput/total_tokens=2,301,888,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11990/500000]
+ train/ActionNoiseL2Loss=0.0519
+ throughput/total_tokens=2,302,080,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=11991/500000]
+ train/ActionNoiseL2Loss=0.0590
+ throughput/total_tokens=2,302,272,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=11992/500000]
+ train/ActionNoiseL2Loss=0.0341
+ throughput/total_tokens=2,302,464,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11993/500000]
+ train/ActionNoiseL2Loss=0.0626
+ throughput/total_tokens=2,302,656,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11994/500000]
+ train/ActionNoiseL2Loss=0.0577
+ throughput/total_tokens=2,302,848,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11995/500000]
+ train/ActionNoiseL2Loss=0.0457
+ throughput/total_tokens=2,303,040,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11996/500000]
+ train/ActionNoiseL2Loss=0.1267
+ throughput/total_tokens=2,303,232,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=11997/500000]
+ train/ActionNoiseL2Loss=0.0367
+ throughput/total_tokens=2,303,424,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11998/500000]
+ train/ActionNoiseL2Loss=0.0409
+ throughput/total_tokens=2,303,616,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=11999/500000]
+ train/ActionNoiseL2Loss=0.0553
+ throughput/total_tokens=2,303,808,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12000/500000]
+ optim/total_grad_norm=0.7690
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=2,304,000,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+10/14 [16:06:24] INFO | >> Saving config... checkpoint.py:608
+10/14 [16:07:05] INFO | >> Saving model state... checkpoint.py:796
+10/14 [16:08:25] INFO | >> Saving optim state... checkpoint.py:811
+10/14 [16:09:58] INFO | >> Saving trainer state... checkpoint.py:670
+ INFO | >> Saving config... checkpoint.py:608
+[step=12001/500000]
+ train/ActionNoiseL2Loss=0.0472
+ throughput/total_tokens=2,304,192,000
+ throughput/device/tokens_per_second=1,133
+ throughput/device/batches_per_second=0.0472
+[step=12002/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=2,304,384,000
+ throughput/device/tokens_per_second=1,132
+ throughput/device/batches_per_second=0.0472
+[step=12003/500000]
+ train/ActionNoiseL2Loss=0.0499
+ throughput/total_tokens=2,304,576,000
+ throughput/device/tokens_per_second=1,134
+ throughput/device/batches_per_second=0.0473
+[step=12004/500000]
+ train/ActionNoiseL2Loss=0.0447
+ throughput/total_tokens=2,304,768,000
+ throughput/device/tokens_per_second=1,139
+ throughput/device/batches_per_second=0.0475
+[step=12005/500000]
+ train/ActionNoiseL2Loss=0.0419
+ throughput/total_tokens=2,304,960,000
+ throughput/device/tokens_per_second=1,141
+ throughput/device/batches_per_second=0.0476
+[step=12006/500000]
+ train/ActionNoiseL2Loss=0.0860
+ throughput/total_tokens=2,305,152,000
+ throughput/device/tokens_per_second=1,144
+ throughput/device/batches_per_second=0.0477
+[step=12007/500000]
+ train/ActionNoiseL2Loss=0.0568
+ throughput/total_tokens=2,305,344,000
+ throughput/device/tokens_per_second=1,145
+ throughput/device/batches_per_second=0.0477
+[step=12008/500000]
+ train/ActionNoiseL2Loss=0.0502
+ throughput/total_tokens=2,305,536,000
+ throughput/device/tokens_per_second=1,146
+ throughput/device/batches_per_second=0.0478
+[step=12009/500000]
+ train/ActionNoiseL2Loss=0.1125
+ throughput/total_tokens=2,305,728,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+[step=12010/500000]
+ train/ActionNoiseL2Loss=0.0564
+ throughput/total_tokens=2,305,920,000
+ throughput/device/tokens_per_second=1,147
+ throughput/device/batches_per_second=0.0478
+ System/Peak GPU Memory (MB)=51,074
+[step=12011/500000]
+ train/ActionNoiseL2Loss=0.0559
+ throughput/total_tokens=2,306,112,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=12012/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=2,306,304,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=12013/500000]
+ train/ActionNoiseL2Loss=0.0728
+ throughput/total_tokens=2,306,496,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=12014/500000]
+ train/ActionNoiseL2Loss=0.0758
+ throughput/total_tokens=2,306,688,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=12015/500000]
+ train/ActionNoiseL2Loss=0.0652
+ throughput/total_tokens=2,306,880,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=12016/500000]
+ train/ActionNoiseL2Loss=0.0934
+ throughput/total_tokens=2,307,072,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=12017/500000]
+ train/ActionNoiseL2Loss=0.0600
+ throughput/total_tokens=2,307,264,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=12018/500000]
+ train/ActionNoiseL2Loss=0.1004
+ throughput/total_tokens=2,307,456,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=12019/500000]
+ train/ActionNoiseL2Loss=0.0456
+ throughput/total_tokens=2,307,648,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=12020/500000]
+ optim/total_grad_norm=1.094
+ train/ActionNoiseL2Loss=0.0871
+ throughput/total_tokens=2,307,840,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=12021/500000]
+ train/ActionNoiseL2Loss=0.0563
+ throughput/total_tokens=2,308,032,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=12022/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=2,308,224,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12023/500000]
+ train/ActionNoiseL2Loss=0.0798
+ throughput/total_tokens=2,308,416,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=12024/500000]
+ train/ActionNoiseL2Loss=0.0541
+ throughput/total_tokens=2,308,608,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=12025/500000]
+ train/ActionNoiseL2Loss=0.0221
+ throughput/total_tokens=2,308,800,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12026/500000]
+ train/ActionNoiseL2Loss=0.0426
+ throughput/total_tokens=2,308,992,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12027/500000]
+ train/ActionNoiseL2Loss=0.0624
+ throughput/total_tokens=2,309,184,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12028/500000]
+ train/ActionNoiseL2Loss=0.0528
+ throughput/total_tokens=2,309,376,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12029/500000]
+ train/ActionNoiseL2Loss=0.0562
+ throughput/total_tokens=2,309,568,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12030/500000]
+ train/ActionNoiseL2Loss=0.0597
+ throughput/total_tokens=2,309,760,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=12031/500000]
+ train/ActionNoiseL2Loss=0.0688
+ throughput/total_tokens=2,309,952,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12032/500000]
+ train/ActionNoiseL2Loss=0.0591
+ throughput/total_tokens=2,310,144,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12033/500000]
+ train/ActionNoiseL2Loss=0.1181
+ throughput/total_tokens=2,310,336,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12034/500000]
+ train/ActionNoiseL2Loss=0.0817
+ throughput/total_tokens=2,310,528,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12035/500000]
+ train/ActionNoiseL2Loss=0.0614
+ throughput/total_tokens=2,310,720,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12036/500000]
+ train/ActionNoiseL2Loss=0.0425
+ throughput/total_tokens=2,310,912,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12037/500000]
+ train/ActionNoiseL2Loss=0.0596
+ throughput/total_tokens=2,311,104,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12038/500000]
+ train/ActionNoiseL2Loss=0.0691
+ throughput/total_tokens=2,311,296,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12039/500000]
+ train/ActionNoiseL2Loss=0.0532
+ throughput/total_tokens=2,311,488,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12040/500000]
+ optim/total_grad_norm=0.6786
+ train/ActionNoiseL2Loss=0.0413
+ throughput/total_tokens=2,311,680,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=12041/500000]
+ train/ActionNoiseL2Loss=0.0649
+ throughput/total_tokens=2,311,872,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12042/500000]
+ train/ActionNoiseL2Loss=0.0814
+ throughput/total_tokens=2,312,064,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12043/500000]
+ train/ActionNoiseL2Loss=0.0707
+ throughput/total_tokens=2,312,256,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=12044/500000]
+ train/ActionNoiseL2Loss=0.0433
+ throughput/total_tokens=2,312,448,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=12045/500000]
+ train/ActionNoiseL2Loss=0.0403
+ throughput/total_tokens=2,312,640,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0480
+[step=12046/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=2,312,832,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=12047/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=2,313,024,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=12048/500000]
+ train/ActionNoiseL2Loss=0.0504
+ throughput/total_tokens=2,313,216,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=12049/500000]
+ train/ActionNoiseL2Loss=0.0607
+ throughput/total_tokens=2,313,408,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+[step=12050/500000]
+ train/ActionNoiseL2Loss=0.0658
+ throughput/total_tokens=2,313,600,000
+ throughput/device/tokens_per_second=1,153
+ throughput/device/batches_per_second=0.0481
+ System/Peak GPU Memory (MB)=51,074
+[step=12051/500000]
+ train/ActionNoiseL2Loss=0.0430
+ throughput/total_tokens=2,313,792,000
+ throughput/device/tokens_per_second=1,150
+ throughput/device/batches_per_second=0.0479
+[step=12052/500000]
+ train/ActionNoiseL2Loss=0.0253
+ throughput/total_tokens=2,313,984,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=12053/500000]
+ train/ActionNoiseL2Loss=0.0670
+ throughput/total_tokens=2,314,176,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=12054/500000]
+ train/ActionNoiseL2Loss=0.0700
+ throughput/total_tokens=2,314,368,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=12055/500000]
+ train/ActionNoiseL2Loss=0.0473
+ throughput/total_tokens=2,314,560,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=12056/500000]
+ train/ActionNoiseL2Loss=0.0672
+ throughput/total_tokens=2,314,752,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=12057/500000]
+ train/ActionNoiseL2Loss=0.0337
+ throughput/total_tokens=2,314,944,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=12058/500000]
+ train/ActionNoiseL2Loss=0.0451
+ throughput/total_tokens=2,315,136,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=12059/500000]
+ train/ActionNoiseL2Loss=0.0693
+ throughput/total_tokens=2,315,328,000
+ throughput/device/tokens_per_second=1,149
+ throughput/device/batches_per_second=0.0479
+[step=12060/500000]
+ optim/total_grad_norm=0.6350
+ train/ActionNoiseL2Loss=0.0482
+ throughput/total_tokens=2,315,520,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+ System/Peak GPU Memory (MB)=51,074
+[step=12061/500000]
+ train/ActionNoiseL2Loss=0.0485
+ throughput/total_tokens=2,315,712,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=12062/500000]
+ train/ActionNoiseL2Loss=0.0598
+ throughput/total_tokens=2,315,904,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=12063/500000]
+ train/ActionNoiseL2Loss=0.0542
+ throughput/total_tokens=2,316,096,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=12064/500000]
+ train/ActionNoiseL2Loss=0.0679
+ throughput/total_tokens=2,316,288,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=12065/500000]
+ train/ActionNoiseL2Loss=0.0448
+ throughput/total_tokens=2,316,480,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=12066/500000]
+ train/ActionNoiseL2Loss=0.0508
+ throughput/total_tokens=2,316,672,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=12067/500000]
+ train/ActionNoiseL2Loss=0.0807
+ throughput/total_tokens=2,316,864,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0479
+[step=12068/500000]
+ train/ActionNoiseL2Loss=0.0388
+ throughput/total_tokens=2,317,056,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=12069/500000]
+ train/ActionNoiseL2Loss=0.0334
+ throughput/total_tokens=2,317,248,000
+ throughput/device/tokens_per_second=1,148
+ throughput/device/batches_per_second=0.0478
+[step=12070/500000]
+ train/ActionNoiseL2Loss=0.0567
+ throughput/total_tokens=2,317,440,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+ System/Peak GPU Memory (MB)=51,074
+[step=12071/500000]
+ train/ActionNoiseL2Loss=0.0471
+ throughput/total_tokens=2,317,632,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=12072/500000]
+ train/ActionNoiseL2Loss=0.0641
+ throughput/total_tokens=2,317,824,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12073/500000]
+ train/ActionNoiseL2Loss=0.0642
+ throughput/total_tokens=2,318,016,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12074/500000]
+ train/ActionNoiseL2Loss=0.0731
+ throughput/total_tokens=2,318,208,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12075/500000]
+ train/ActionNoiseL2Loss=0.0444
+ throughput/total_tokens=2,318,400,000
+ throughput/device/tokens_per_second=1,151
+ throughput/device/batches_per_second=0.0480
+[step=12076/500000]
+ train/ActionNoiseL2Loss=0.0922
+ throughput/total_tokens=2,318,592,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12077/500000]
+ train/ActionNoiseL2Loss=0.0664
+ throughput/total_tokens=2,318,784,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
+[step=12078/500000]
+ train/ActionNoiseL2Loss=0.0526
+ throughput/total_tokens=2,318,976,000
+ throughput/device/tokens_per_second=1,152
+ throughput/device/batches_per_second=0.0480
diff --git a/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/files/requirements.txt b/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/files/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..5a5e971a5d9f3b6f6a75248e203682c5fbcd69e8
--- /dev/null
+++ b/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/files/requirements.txt
@@ -0,0 +1,286 @@
+ai2-molmo==0.0.0
+astunparse==1.6.3
+flatbuffers==25.2.10
+gast==0.6.0
+google-pasta==0.2.0
+h5py==3.14.0
+libclang==18.1.1
+Markdown==3.9
+namex==0.1.0
+opt_einsum==3.4.0
+optree==0.17.0
+tensorboard-data-server==0.7.2
+tensorflow-io-gcs-filesystem==0.37.1
+termcolor==3.1.0
+Werkzeug==3.1.3
+Brotli==1.1.0
+Farama-Notifications==0.0.4
+MarkupSafe==2.1.5
+PyYAML==6.0.2
+absl-py==2.3.1
+accelerate==1.10.1
+ai2-molmo==0.0.0
+aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.15
+aiosignal==1.4.0
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+anyio==4.10.0
+array_record==0.8.1
+async-timeout==5.0.1
+attrs==25.3.0
+av==15.1.0
+backports.tarfile==1.2.0
+beaker-gantry==3.2.0
+beaker-py==2.5.0
+black==23.12.1
+blinker==1.9.0
+boltons==25.0.0
+boto3==1.40.33
+botocore==1.40.33
+build==1.3.0
+cached_path==1.7.3
+cached-property==2.0.1
+cachetools==5.5.2
+certifi==2025.8.3
+cffi==2.0.0
+charset-normalizer==3.4.3
+click==8.2.1
+click-help-colors==0.9.4
+click-option-group==0.5.7
+cloudpickle==3.1.1
+cmake==4.1.0
+contourpy==1.3.2
+cryptography==46.0.1
+cycler==0.12.1
+dataclass-extensions==0.2.3
+datasets==3.6.0
+decorator==5.2.1
+deepdiff==8.6.1
+diffusers==0.35.1
+dill==0.3.8
+distro==1.9.0
+dlimp==0.0.1
+dm-tree==0.1.9
+docutils==0.22.1
+draccus==0.10.0
+editdistance==0.8.1
+einops==0.8.1
+einops-exts==0.0.4
+et_xmlfile==2.0.0
+etils==1.13.0
+evdev==1.9.2
+exceptiongroup==1.3.0
+face==24.0.0
+fastapi==0.116.2
+ffmpy==0.6.1
+fiddle==0.3.0
+filelock==3.13.1
+Flask==3.1.2
+fonttools==4.60.0
+frozenlist==1.7.0
+fsspec==2023.9.2
+ftfy==6.3.1
+gcsfs==2023.9.2
+gitdb==4.0.12
+GitPython==3.1.45
+glom==24.11.0
+google-api-core==2.25.1
+google-auth==2.40.3
+google-auth-oauthlib==1.2.2
+google-cloud-core==2.4.3
+google-cloud-storage==2.19.0
+google-crc32c==1.7.1
+google-resumable-media==2.7.2
+googleapis-common-protos==1.70.0
+gradio==5.46.0
+gradio_client==1.13.0
+graphviz==0.21
+groovy==0.1.2
+grpcio==1.75.0
+gymnasium==0.29.1
+h11==0.16.0
+hf_transfer==0.1.9
+hf-xet==1.1.10
+httpcore==1.0.9
+httpx==0.28.1
+huggingface-hub==0.35.0
+id==1.5.0
+idna==3.10
+imageio==2.37.0
+imageio-ffmpeg==0.6.0
+importlib_metadata==8.7.0
+importlib_resources==6.5.2
+iniconfig==2.1.0
+inquirerpy==0.3.4
+isort==5.12.0
+itsdangerous==2.2.0
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.3.0
+jeepney==0.9.0
+Jinja2==3.1.4
+jiter==0.11.0
+jmespath==1.0.1
+joblib==1.5.2
+jsonlines==4.0.0
+keras==2.15.0
+keyring==25.6.0
+kiwisolver==1.4.9
+latex2sympy2_extended==1.10.2
+lerobot==0.3.4
+Levenshtein==0.27.1
+libcst==1.8.4
+lightning-utilities==0.15.2
+markdown-it-py==4.0.0
+math-verify==0.8.0
+matplotlib==3.10.6
+mdurl==0.1.2
+mergedeep==1.3.4
+ml-dtypes==0.2.0
+ml_dtypes==0.5.3
+more-itertools==10.8.0
+mpmath==1.3.0
+msgspec==0.19.0
+multidict==6.6.4
+multiprocess==0.70.16
+mypy==1.3.0
+mypy_extensions==1.1.0
+necessary==0.4.3
+networkx==3.3
+nh3==0.3.0
+nltk==3.9.1
+numpy==1.26.4
+oauthlib==3.3.1
+omegaconf==2.3.0
+openai==1.108.0
+opencv-python-headless==4.12.0.88
+OpenEXR==3.4.0
+openpyxl==3.1.5
+orderly-set==5.5.0
+orjson==3.11.3
+packaging==25.0
+pandas==2.3.2
+pathspec==0.12.1
+petname==2.6
+pfzy==0.3.4
+pillow==11.0.0
+pip==25.2
+platformdirs==4.4.0
+pluggy==1.6.0
+promise==2.3
+prompt_toolkit==3.0.52
+propcache==0.3.2
+proto-plus==1.26.1
+protobuf==4.21.12
+protobuf==6.32.1
+psutil==7.1.0
+pyarrow==21.0.0
+pyasn1==0.6.1
+pyasn1_modules==0.4.2
+pycparser==2.23
+pydantic==2.11.9
+pydantic_core==2.33.2
+pydub==0.25.1
+Pygments==2.19.2
+pynput==1.8.1
+pyparsing==3.2.4
+pyproject_hooks==1.2.0
+pyserial==3.5
+pytest==8.4.2
+pytest-sphinx==0.6.3
+python-dateutil==2.9.0.post0
+python-Levenshtein==0.27.1
+python-multipart==0.0.20
+python-xlib==0.33
+pytorch-triton-rocm==3.4.0
+pytz==2025.2
+pyyaml-include==1.4.1
+RapidFuzz==3.14.1
+readme_renderer==44.0
+regex==2025.9.1
+requests==2.32.5
+requests-oauthlib==2.0.0
+requests-toolbelt==1.0.0
+requirements-parser==0.13.0
+rerun-sdk==0.22.1
+rfc3986==2.0.0
+rich==13.9.4
+rsa==4.9.1
+ruff==0.13.0
+s3transfer==0.14.0
+safehttpx==0.1.6
+safetensors==0.6.2
+scikit-learn==1.7.2
+scipy==1.15.3
+SecretStorage==3.4.0
+semantic-version==2.10.0
+sentencepiece==0.2.1
+sentry-sdk==2.38.0
+setuptools==78.1.1
+shellingham==1.5.4
+six==1.17.0
+smart_open==7.3.1
+smashed==0.21.5
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.48.0
+sympy==1.13.3
+tensorboard==2.15.2
+tensorboard==2.19.0
+tensorflow==2.15.0
+tensorflow-addons==0.23.0
+tensorflow-datasets==4.9.3
+tensorflow-estimator==2.15.0
+tensorflow-graphics==2021.12.3
+tensorflow-metadata==1.17.2
+threadpoolctl==3.6.0
+timm==1.0.19
+tokenizers==0.22.0
+toml==0.10.2
+tomli==2.2.1
+tomlkit==0.13.3
+torch==2.8.0+rocm6.4
+torchcodec==0.5
+torchmetrics==1.8.2
+torchvision==0.23.0+rocm6.4
+tqdm==4.67.1
+transformers==4.56.1
+trimesh==4.8.2
+trouting==0.3.3
+twine==6.2.0
+typeguard==2.13.3
+typer==0.17.4
+typing_extensions==4.15.0
+typing-inspect==0.9.0
+typing-inspection==0.4.1
+tzdata==2025.2
+urllib3==2.5.0
+uvicorn==0.35.0
+wandb==0.21.4
+wcwidth==0.2.13
+websockets==15.0.1
+wheel==0.45.1
+wrapt==1.14.2
+xxhash==3.5.0
+yarl==1.20.1
+zipp==3.23.0
+lerobot==0.3.4
+minLoRA==0.1.0
+autocommand==2.2.2
+backports.tarfile==1.2.0
+importlib_metadata==8.0.0
+inflect==7.3.1
+jaraco.collections==5.1.0
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+more-itertools==10.3.0
+packaging==24.2
+platformdirs==4.2.2
+tomli==2.0.1
+typeguard==4.3.0
+typing_extensions==4.12.2
+wheel==0.45.1
+zipp==3.19.2
diff --git a/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/files/wandb-metadata.json b/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/files/wandb-metadata.json
new file mode 100644
index 0000000000000000000000000000000000000000..3d81403808126bb3f5e320734c6d35f1e5b80a32
--- /dev/null
+++ b/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/files/wandb-metadata.json
@@ -0,0 +1,204 @@
+{
+ "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35",
+ "python": "CPython 3.10.18",
+ "startedAt": "2025-10-11T16:38:44.830364Z",
+ "args": [
+ "qwen2_7b",
+ "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/pen_flow_matching",
+ "--vision_backbone",
+ "openai",
+ "--action_head",
+ "flow_matching",
+ "--seq_len",
+ "1600",
+ "--ft_llm",
+ "--checkpoint",
+ "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924",
+ "--device_train_microbatch_size",
+ "16",
+ "--global_batch_size",
+ "126",
+ "--dataset",
+ "vla_dataset_realworld",
+ "--llm_learning_rate",
+ "5e-5",
+ "--wandb_entity",
+ "henryeap",
+ "--wandb_project",
+ "a1-realworld",
+ "--wandb_run_name",
+ "pen",
+ "--real_world_vla_config_path",
+ "vla_config_realworld/vla_config_pen.yaml",
+ "--save_overwrite"
+ ],
+ "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py",
+ "codePath": "launch_scripts/train_vla.py",
+ "codePathLocal": "launch_scripts/train_vla.py",
+ "git": {
+ "remote": "https://github.com/Spatialtemporal-AI/A1.git",
+ "commit": "7c171df5d31577ede69d05172c2bc62d42ef3e3d"
+ },
+ "email": "ihenrykwok@outlook.com",
+ "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/pen_flow_matching/wandb",
+ "host": "auh7-1b-gpu-253",
+ "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10",
+ "cpu_count": 64,
+ "cpu_count_logical": 128,
+ "gpu": "Instinct MI210",
+ "gpu_count": 8,
+ "disk": {
+ "/": {
+ "total": "3778763694080",
+ "used": "50589351936"
+ }
+ },
+ "memory": {
+ "total": "2434606940160"
+ },
+ "gpu_amd": [
+ {
+ "id": "7",
+ "uniqueId": "0x79f34beb0df1642b",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "1",
+ "uniqueId": "0xde7b3a3b0e7b52be",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "6",
+ "uniqueId": "0xe08249923e0a99ae",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "0",
+ "uniqueId": "0x6e39dcc60a37a155",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "5",
+ "uniqueId": "0xc01c66958a593461",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "3",
+ "uniqueId": "0x7d5ed86cf6c4a80a",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "4",
+ "uniqueId": "0x22f4e1ec1e4766a1",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ },
+ {
+ "id": "2",
+ "uniqueId": "0xe24ebd0f35014c51",
+ "vbiosVersion": "113-D67301V-073",
+ "performanceLevel": "auto",
+ "maxPower": "300.0",
+ "series": "Instinct MI210",
+ "model": "0x740f",
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
+ "sku": "D67301V",
+ "sclkRange": "500Mhz - 1700Mhz",
+ "mclkRange": "400Mhz - 1600Mhz"
+ }
+ ],
+ "slurm": {
+ "cluster_name": "ai-04r",
+ "conf": "/etc/slurm/slurm.conf",
+ "cpus_on_node": "128",
+ "gpus_on_node": "8",
+ "gtids": "0",
+ "job_account": "faculty-acc",
+ "job_cpus_per_node": "128",
+ "job_end_time": "1760459846",
+ "job_gid": "2000",
+ "job_gpus": "0,1,2,3,4,5,6,7",
+ "job_id": "2287",
+ "job_name": "mh_pen_flow_matching",
+ "job_nodelist": "auh7-1b-gpu-253",
+ "job_num_nodes": "1",
+ "job_partition": "faculty",
+ "job_qos": "xdqos",
+ "job_start_time": "1760200646",
+ "job_uid": "2013",
+ "job_user": "xiaodan",
+ "jobid": "2287",
+ "localid": "0",
+ "nnodes": "1",
+ "nodeid": "0",
+ "nodelist": "auh7-1b-gpu-253",
+ "nprocs": "1",
+ "ntasks": "1",
+ "ntasks_per_node": "1",
+ "oom_kill_step": "0",
+ "prio_process": "0",
+ "procid": "0",
+ "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts",
+ "submit_host": "auh-1b-cpu-login-001",
+ "task_pid": "411389",
+ "tasks_per_node": "1",
+ "topology_addr": "auh7-1b-gpu-253",
+ "topology_addr_pattern": "node"
+ },
+ "writerId": "c87r2obvd7qa3blbvewjvdehottl5rrr"
+}
\ No newline at end of file
diff --git a/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/logs/debug-core.log b/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/logs/debug-core.log
new file mode 100644
index 0000000000000000000000000000000000000000..d7c22af20496037043449115975532679faf5cfc
--- /dev/null
+++ b/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/logs/debug-core.log
@@ -0,0 +1,6 @@
+{"time":"2025-10-11T16:38:45.197330387Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpygij4s57/port-579278.txt","pid":579278,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
+{"time":"2025-10-11T16:38:45.198122306Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":579278}
+{"time":"2025-10-11T16:38:45.199702094Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-579278-579454-1269370264/socket","Net":"unix"}}
+{"time":"2025-10-11T16:38:45.353337002Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
+{"time":"2025-10-11T16:38:45.368049369Z","level":"INFO","msg":"handleInformInit: received","streamId":"qzez8pv7","id":"1(@)"}
+{"time":"2025-10-11T16:38:46.624632949Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"qzez8pv7","id":"1(@)"}
diff --git a/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/logs/debug-internal.log b/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/logs/debug-internal.log
new file mode 100644
index 0000000000000000000000000000000000000000..5d4a91d552a492c44ec46baa0b184318111d7720
--- /dev/null
+++ b/pen_flow_matching/wandb/wandb/run-20251011_163844-a381qnn9/logs/debug-internal.log
@@ -0,0 +1,8 @@
+{"time":"2025-10-11T16:38:45.301569164Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
+{"time":"2025-10-11T16:38:46.459201786Z","level":"INFO","msg":"stream: created new stream","id":"a381qnn9"}
+{"time":"2025-10-11T16:38:46.459237957Z","level":"INFO","msg":"stream: started","id":"a381qnn9"}
+{"time":"2025-10-11T16:38:46.459266458Z","level":"INFO","msg":"handler: started","stream_id":"a381qnn9"}
+{"time":"2025-10-11T16:38:46.459291898Z","level":"INFO","msg":"sender: started","stream_id":"a381qnn9"}
+{"time":"2025-10-11T16:38:46.459287598Z","level":"INFO","msg":"writer: started","stream_id":"a381qnn9"}
+{"time":"2025-10-12T06:42:47.897888022Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/henryeap/a1-realworld/a381qnn9/file_stream","body":"\n\n\n502 Server Error\n\n\nError: Server Error
\nThe server encountered a temporary error and could not complete your request.
Please try again in 30 seconds.\n
\n\n"}
+{"time":"2025-10-12T14:34:32.120286068Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/henryeap/a1-realworld/a381qnn9/file_stream","body":"\n\n\n502 Server Error\n\n\nError: Server Error
\nThe server encountered a temporary error and could not complete your request.
Please try again in 30 seconds.\n
\n\n"}
diff --git a/wandb/wandb/debug.log b/wandb/wandb/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/wandb/wandb/run-20251002_155015-xojint20/logs/debug.log b/wandb/wandb/run-20251002_155015-xojint20/logs/debug.log
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/wandb/wandb/run-20251002_155442-6v8q0jgn/run-6v8q0jgn.wandb b/wandb/wandb/run-20251002_155442-6v8q0jgn/run-6v8q0jgn.wandb
new file mode 100644
index 0000000000000000000000000000000000000000..48e5cad1c12909a5b263508babce2356a9757bf9
--- /dev/null
+++ b/wandb/wandb/run-20251002_155442-6v8q0jgn/run-6v8q0jgn.wandb
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5fde97b8661375218dfdcc3b44c8c3b41daef8ad1b0db64eab868b94a1e2909d
+size 2490368